Mock Version: 5.9 Mock Version: 5.9 Mock Version: 5.9 ENTER ['do_with_status'](['bash', '--login', '-c', '/usr/bin/rpmbuild -bs --noclean --target x86_64 --nodeps /builddir/build/SPECS/rccl.spec'], chrootPath='/var/lib/mock/f42-build-55706471-6538073/root'env={'TERM': 'vt100', 'SHELL': '/bin/bash', 'HOME': '/builddir', 'HOSTNAME': 'mock', 'PATH': '/usr/bin:/bin:/usr/sbin:/sbin', 'PROMPT_COMMAND': 'printf "\\033]0;\\007"', 'PS1': ' \\s-\\v\\$ ', 'LANG': 'C.UTF-8'}shell=Falselogger=timeout=201600uid=1000gid=425user='mockbuild'unshare_net=TrueprintOutput=Falsenspawn_args=['--capability=cap_ipc_lock', '--bind=/tmp/mock-resolv.vcer5xhi:/etc/resolv.conf', '--bind=/dev/btrfs-control', '--bind=/dev/mapper/control', '--bind=/dev/fuse', '--bind=/dev/loop-control', '--bind=/dev/loop0', '--bind=/dev/loop1', '--bind=/dev/loop2', '--bind=/dev/loop3', '--bind=/dev/loop4', '--bind=/dev/loop5', '--bind=/dev/loop6', '--bind=/dev/loop7', '--bind=/dev/loop8', '--bind=/dev/loop9', '--bind=/dev/loop10', '--bind=/dev/loop11']) Using nspawn with args ['--capability=cap_ipc_lock', '--bind=/tmp/mock-resolv.vcer5xhi:/etc/resolv.conf', '--bind=/dev/btrfs-control', '--bind=/dev/mapper/control', '--bind=/dev/fuse', '--bind=/dev/loop-control', '--bind=/dev/loop0', '--bind=/dev/loop1', '--bind=/dev/loop2', '--bind=/dev/loop3', '--bind=/dev/loop4', '--bind=/dev/loop5', '--bind=/dev/loop6', '--bind=/dev/loop7', '--bind=/dev/loop8', '--bind=/dev/loop9', '--bind=/dev/loop10', '--bind=/dev/loop11'] Executing command: ['/usr/bin/systemd-nspawn', '-q', '-M', 'd2cfb4d08062499baa8ec9b00a5f505d', '-D', '/var/lib/mock/f42-build-55706471-6538073/root', '-a', '-u', 'mockbuild', '--capability=cap_ipc_lock', '--bind=/tmp/mock-resolv.vcer5xhi:/etc/resolv.conf', '--bind=/dev/btrfs-control', '--bind=/dev/mapper/control', '--bind=/dev/fuse', '--bind=/dev/loop-control', '--bind=/dev/loop0', '--bind=/dev/loop1', '--bind=/dev/loop2', '--bind=/dev/loop3', '--bind=/dev/loop4', '--bind=/dev/loop5', '--bind=/dev/loop6', '--bind=/dev/loop7', '--bind=/dev/loop8', '--bind=/dev/loop9', '--bind=/dev/loop10', '--bind=/dev/loop11', '--console=pipe', '--setenv=TERM=vt100', '--setenv=SHELL=/bin/bash', '--setenv=HOME=/builddir', '--setenv=HOSTNAME=mock', '--setenv=PATH=/usr/bin:/bin:/usr/sbin:/sbin', '--setenv=PROMPT_COMMAND=printf "\\033]0;\\007"', '--setenv=PS1= \\s-\\v\\$ ', '--setenv=LANG=C.UTF-8', '--resolv-conf=off', 'bash', '--login', '-c', '/usr/bin/rpmbuild -bs --noclean --target x86_64 --nodeps /builddir/build/SPECS/rccl.spec'] with env {'TERM': 'vt100', 'SHELL': '/bin/bash', 'HOME': '/builddir', 'HOSTNAME': 'mock', 'PATH': '/usr/bin:/bin:/usr/sbin:/sbin', 'PROMPT_COMMAND': 'printf "\\033]0;\\007"', 'PS1': ' \\s-\\v\\$ ', 'LANG': 'C.UTF-8', 'SYSTEMD_NSPAWN_TMPFS_TMP': '0', 'SYSTEMD_SECCOMP': '0'} and shell False Building target platforms: x86_64 Building for target x86_64 setting SOURCE_DATE_EPOCH=1727308800 Wrote: /builddir/build/SRPMS/rccl-6.2.1-1.fc42.src.rpm Child return code was: 0 ENTER ['do_with_status'](['bash', '--login', '-c', '/usr/bin/rpmbuild -bb --noclean --target x86_64 --nodeps /builddir/build/SPECS/rccl.spec'], chrootPath='/var/lib/mock/f42-build-55706471-6538073/root'env={'TERM': 'vt100', 'SHELL': '/bin/bash', 'HOME': '/builddir', 'HOSTNAME': 'mock', 'PATH': '/usr/bin:/bin:/usr/sbin:/sbin', 'PROMPT_COMMAND': 'printf "\\033]0;\\007"', 'PS1': ' \\s-\\v\\$ ', 'LANG': 'C.UTF-8'}shell=Falselogger=timeout=201600uid=1000gid=425user='mockbuild'unshare_net=TrueprintOutput=Falsenspawn_args=['--capability=cap_ipc_lock', '--bind=/tmp/mock-resolv.vcer5xhi:/etc/resolv.conf', '--bind=/dev/btrfs-control', '--bind=/dev/mapper/control', '--bind=/dev/fuse', '--bind=/dev/loop-control', '--bind=/dev/loop0', '--bind=/dev/loop1', '--bind=/dev/loop2', '--bind=/dev/loop3', '--bind=/dev/loop4', '--bind=/dev/loop5', '--bind=/dev/loop6', '--bind=/dev/loop7', '--bind=/dev/loop8', '--bind=/dev/loop9', '--bind=/dev/loop10', '--bind=/dev/loop11']) Using nspawn with args ['--capability=cap_ipc_lock', '--bind=/tmp/mock-resolv.vcer5xhi:/etc/resolv.conf', '--bind=/dev/btrfs-control', '--bind=/dev/mapper/control', '--bind=/dev/fuse', '--bind=/dev/loop-control', '--bind=/dev/loop0', '--bind=/dev/loop1', '--bind=/dev/loop2', '--bind=/dev/loop3', '--bind=/dev/loop4', '--bind=/dev/loop5', '--bind=/dev/loop6', '--bind=/dev/loop7', '--bind=/dev/loop8', '--bind=/dev/loop9', '--bind=/dev/loop10', '--bind=/dev/loop11'] Executing command: ['/usr/bin/systemd-nspawn', '-q', '-M', '2d2fd6b0534047fbbc531e2c72c9db62', '-D', '/var/lib/mock/f42-build-55706471-6538073/root', '-a', '-u', 'mockbuild', '--capability=cap_ipc_lock', '--bind=/tmp/mock-resolv.vcer5xhi:/etc/resolv.conf', '--bind=/dev/btrfs-control', '--bind=/dev/mapper/control', '--bind=/dev/fuse', '--bind=/dev/loop-control', '--bind=/dev/loop0', '--bind=/dev/loop1', '--bind=/dev/loop2', '--bind=/dev/loop3', '--bind=/dev/loop4', '--bind=/dev/loop5', '--bind=/dev/loop6', '--bind=/dev/loop7', '--bind=/dev/loop8', '--bind=/dev/loop9', '--bind=/dev/loop10', '--bind=/dev/loop11', '--console=pipe', '--setenv=TERM=vt100', '--setenv=SHELL=/bin/bash', '--setenv=HOME=/builddir', '--setenv=HOSTNAME=mock', '--setenv=PATH=/usr/bin:/bin:/usr/sbin:/sbin', '--setenv=PROMPT_COMMAND=printf "\\033]0;\\007"', '--setenv=PS1= \\s-\\v\\$ ', '--setenv=LANG=C.UTF-8', '--resolv-conf=off', 'bash', '--login', '-c', '/usr/bin/rpmbuild -bb --noclean --target x86_64 --nodeps /builddir/build/SPECS/rccl.spec'] with env {'TERM': 'vt100', 'SHELL': '/bin/bash', 'HOME': '/builddir', 'HOSTNAME': 'mock', 'PATH': '/usr/bin:/bin:/usr/sbin:/sbin', 'PROMPT_COMMAND': 'printf "\\033]0;\\007"', 'PS1': ' \\s-\\v\\$ ', 'LANG': 'C.UTF-8', 'SYSTEMD_NSPAWN_TMPFS_TMP': '0', 'SYSTEMD_SECCOMP': '0'} and shell False Building target platforms: x86_64 Building for target x86_64 setting SOURCE_DATE_EPOCH=1727308800 Executing(%mkbuilddir): /bin/sh -e /var/tmp/rpm-tmp.DY8Cvw + umask 022 + cd /builddir/build/BUILD/rccl-6.2.1-build + test -d /builddir/build/BUILD/rccl-6.2.1-build + /usr/bin/chmod -Rf a+rX,u+w,g-w,o-w /builddir/build/BUILD/rccl-6.2.1-build + /usr/bin/rm -rf /builddir/build/BUILD/rccl-6.2.1-build + /usr/bin/mkdir -p /builddir/build/BUILD/rccl-6.2.1-build + /usr/bin/mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/SPECPARTS + RPM_EC=0 ++ jobs -p + exit 0 Executing(%prep): /bin/sh -e /var/tmp/rpm-tmp.zkXZBQ + umask 022 + cd /builddir/build/BUILD/rccl-6.2.1-build + cd /builddir/build/BUILD/rccl-6.2.1-build + rm -rf rccl-rocm-6.2.1 + /usr/lib/rpm/rpmuncompress -x /builddir/build/SOURCES/RCCL-6.2.1.tar.gz + STATUS=0 + '[' 0 -ne 0 ']' + cd rccl-rocm-6.2.1 + /usr/bin/chmod -Rf a+rX,u+w,g-w,o-w . + sed -i -e '/AMD GPU targets to compile for/d' CMakeLists.txt + sed -i -e /parallel-jobs/d CMakeLists.txt + sed -i -e 's@cat ${ROCM_PATH}/.info/version@echo 6.2.1@' CMakeLists.txt + RPM_EC=0 ++ jobs -p + exit 0 Executing(%build): /bin/sh -e /var/tmp/rpm-tmp.wc12qt + umask 022 + cd /builddir/build/BUILD/rccl-6.2.1-build + CFLAGS='-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer ' + export CFLAGS + CXXFLAGS='-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer' + export CXXFLAGS + FFLAGS='-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FFLAGS + FCFLAGS='-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FCFLAGS + VALAFLAGS=-g + export VALAFLAGS + RUSTFLAGS='-Copt-level=3 -Cdebuginfo=2 -Ccodegen-units=1 -Cstrip=none -Cforce-frame-pointers=yes -Clink-arg=-specs=/usr/lib/rpm/redhat/redhat-package-notes --cap-lints=warn' + export RUSTFLAGS + LDFLAGS='-Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes ' + export LDFLAGS + LT_SYS_LIBRARY_PATH=/usr/lib64: + export LT_SYS_LIBRARY_PATH + CC=hipcc + export CC + CXX=hipcc + export CXX + cd rccl-rocm-6.2.1 + for gpu in gfx9 gfx11 gfx90a gfx942 gfx1100 + module load rocm/gfx9 + local _mlredir=0 + '[' -n '' ']' + case " $@ " in + '[' 0 -eq 0 ']' + _module_raw load rocm/gfx9 ++ /usr/bin/tclsh /usr/share/Modules/libexec/modulecmd.tcl bash load rocm/gfx9 + eval 'LD_LIBRARY_PATH=/usr/lib64/rocm/gfx9/lib; export LD_LIBRARY_PATH; __MODULES_LMCONFLICT=rocm/gfx9\&rocm; export __MODULES_LMCONFLICT; PATH=/usr/lib64/rocm/gfx9/bin:/usr/share/Modules/bin:/usr/bin:/bin:/usr/sbin:/sbin:/usr/local/sbin; export PATH; ROCM_BIN=/usr/lib64/rocm/gfx9/bin; export ROCM_BIN; _LMFILES_=/usr/share/modulefiles/rocm/gfx9; export _LMFILES_; LOADEDMODULES=rocm/gfx9; export LOADEDMODULES; PYTHONPATH=/usr/lib64/rocm/gfx9/lib64/python3.13/site-packages/; export PYTHONPATH; ROCM_GPUS=gfx900\;gfx906:xnack-\;gfx908:xnack-\;gfx90a:xnack+\;gfx90a:xnack-\;gfx942; export ROCM_GPUS; ROCM_LIB=/usr/lib64/rocm/gfx9/lib; export ROCM_LIB; test 0;' ++ LD_LIBRARY_PATH=/usr/lib64/rocm/gfx9/lib ++ export LD_LIBRARY_PATH ++ __MODULES_LMCONFLICT='rocm/gfx9&rocm' ++ export __MODULES_LMCONFLICT ++ PATH=/usr/lib64/rocm/gfx9/bin:/usr/share/Modules/bin:/usr/bin:/bin:/usr/sbin:/sbin:/usr/local/sbin ++ export PATH ++ ROCM_BIN=/usr/lib64/rocm/gfx9/bin ++ export ROCM_BIN ++ _LMFILES_=/usr/share/modulefiles/rocm/gfx9 ++ export _LMFILES_ ++ LOADEDMODULES=rocm/gfx9 ++ export LOADEDMODULES ++ PYTHONPATH=/usr/lib64/rocm/gfx9/lib64/python3.13/site-packages/ ++ export PYTHONPATH ++ ROCM_GPUS='gfx900;gfx906:xnack-;gfx908:xnack-;gfx90a:xnack+;gfx90a:xnack-;gfx942' ++ export ROCM_GPUS ++ ROCM_LIB=/usr/lib64/rocm/gfx9/lib ++ export ROCM_LIB ++ test 0 + _mlstatus=0 + return 0 + CFLAGS='-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer ' + export CFLAGS + CXXFLAGS='-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer' + export CXXFLAGS + FFLAGS='-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FFLAGS + FCFLAGS='-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -I/usr/lib64/gfortran/modules ' + export FCFLAGS + VALAFLAGS=-g + export VALAFLAGS + RUSTFLAGS='-Copt-level=3 -Cdebuginfo=2 -Ccodegen-units=1 -Cstrip=none -Cforce-frame-pointers=yes -Clink-arg=-specs=/usr/lib/rpm/redhat/redhat-package-notes --cap-lints=warn' + export RUSTFLAGS + LDFLAGS='-Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes ' + export LDFLAGS + LT_SYS_LIBRARY_PATH=/usr/lib64: + export LT_SYS_LIBRARY_PATH + CC=hipcc + export CC + CXX=hipcc + export CXX + /usr/bin/cmake -S . -B redhat-linux-build-gfx9 -DCMAKE_C_FLAGS_RELEASE:STRING=-DNDEBUG -DCMAKE_CXX_FLAGS_RELEASE:STRING=-DNDEBUG -DCMAKE_Fortran_FLAGS_RELEASE:STRING=-DNDEBUG -DCMAKE_VERBOSE_MAKEFILE:BOOL=ON -DCMAKE_INSTALL_DO_STRIP:BOOL=OFF -DCMAKE_INSTALL_PREFIX:PATH=/usr -DINCLUDE_INSTALL_DIR:PATH=/usr/include -DLIB_INSTALL_DIR:PATH=/usr/lib64 -DSYSCONF_INSTALL_DIR:PATH=/etc -DSHARE_INSTALL_PREFIX:PATH=/usr/share -DLIB_SUFFIX=64 -DBUILD_SHARED_LIBS:BOOL=ON -G Ninja -DCMAKE_BUILD_TYPE=RelWithDebInfo -DCMAKE_SKIP_RPATH=ON -DBUILD_FILE_REORG_BACKWARD_COMPATIBILITY=OFF -DCMAKE_INSTALL_LIBDIR=/usr/lib64 -DROCM_SYMLINK_LIBS=OFF '-DAMDGPU_TARGETS=gfx900;gfx906:xnack-;gfx908:xnack-;gfx90a:xnack+;gfx90a:xnack-;gfx942' -DCMAKE_INSTALL_LIBDIR=/usr/lib64/rocm/gfx9/lib -DCMAKE_INSTALL_BINDIR=/usr/lib64/rocm/gfx9/bin -DBUILD_TESTS=OFF -DHIP_PLATFORM=amd CMake Deprecation Warning at CMakeLists.txt:6 (cmake_minimum_required): Compatibility with CMake < 3.10 will be removed from a future version of CMake. Update the VERSION argument value. Or, use the ... syntax to tell CMake that the project requires at least but has been updated to work with policies introduced by or earlier. -- CMAKE_TOOLCHAIN_FILE: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/toolchain-linux.cmake -- The CXX compiler identification is Clang 18.0.0 -- Detecting CXX compiler ABI info -- Detecting CXX compiler ABI info - done -- Check for working CXX compiler: /usr/bin/hipcc - skipped -- Detecting CXX compile features -- Detecting CXX compile features - done -- Could NOT find GTest (missing: GTEST_LIBRARY GTEST_INCLUDE_DIR GTEST_MAIN_LIBRARY) (Required is at least version "1.11") -- Checking for ROCm support for GPU targets: -- Performing Test COMPILER_HAS_TARGET_ID_gfx900 -- Performing Test COMPILER_HAS_TARGET_ID_gfx900 - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx906_xnack_off -- Performing Test COMPILER_HAS_TARGET_ID_gfx906_xnack_off - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx908_xnack_off -- Performing Test COMPILER_HAS_TARGET_ID_gfx908_xnack_off - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx90a_xnack_on -- Performing Test COMPILER_HAS_TARGET_ID_gfx90a_xnack_on - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx90a_xnack_off -- Performing Test COMPILER_HAS_TARGET_ID_gfx90a_xnack_off - Success -- Performing Test COMPILER_HAS_TARGET_ID_gfx942 -- Performing Test COMPILER_HAS_TARGET_ID_gfx942 - Success -- Compiling for gfx900;gfx906:xnack-;gfx908:xnack-;gfx90a:xnack+;gfx90a:xnack-;gfx942 -- Could NOT find GTest (missing: GTEST_LIBRARY GTEST_INCLUDE_DIR GTEST_MAIN_LIBRARY) (Required is at least version "1.11") -- ROCM_PATH found: /opt/rocm -- Performing Test CMAKE_HAVE_LIBC_PTHREAD -- Performing Test CMAKE_HAVE_LIBC_PTHREAD - Success -- Found Threads: TRUE -- Performing Test HIP_CLANG_SUPPORTS_PARALLEL_JOBS -- Performing Test HIP_CLANG_SUPPORTS_PARALLEL_JOBS - Success -- HIP compiler: clang -- HIP runtime: rocclr -- hipcc executable: /usr/bin/hipcc sh: line 1: /usr/bin/rocm_agent_enumerator: No such file or directory -- hipcc version: 6.3.42131 -- ROCm version: 6.2.1 ******************************************************************************* *------------------------------- ROCMChecks WARNING --------------------------* Options and properties should be set on a cmake target where possible. The variable 'CMAKE_CXX_FLAGS' may be set by the cmake toolchain, either by calling 'cmake -DCMAKE_CXX_FLAGS="-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer"' or set in a toolchain file and added with 'cmake -DCMAKE_TOOLCHAIN_FILE='. ROCMChecks now calling: CMake Warning at /usr/share/rocmcmakebuildtools/cmake/ROCMChecks.cmake:46 (message): 'CMAKE_CXX_FLAGS' is set at /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/CMakeLists.txt: shown below: Call Stack (most recent call first): /usr/share/cmake/Modules/CheckSymbolExists.cmake:9223372036854775807 (rocm_check_toolchain_var) /usr/share/cmake/Modules/CheckSymbolExists.cmake:87 (string) /usr/share/cmake/Modules/CheckSymbolExists.cmake:71 (__CHECK_SYMBOL_EXISTS_FILTER_FLAGS) CMakeLists.txt:155 (check_symbol_exists) *-----------------------------------------------------------------------------* ******************************************************************************* ******************************************************************************* *------------------------------- ROCMChecks WARNING --------------------------* Options and properties should be set on a cmake target where possible. The variable 'CMAKE_CXX_FLAGS' may be set by the cmake toolchain, either by calling 'cmake -DCMAKE_CXX_FLAGS="-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer"' or set in a toolchain file and added with 'cmake -DCMAKE_TOOLCHAIN_FILE='. ROCMChecks now calling: CMake Warning at /usr/share/rocmcmakebuildtools/cmake/ROCMChecks.cmake:46 (message): 'CMAKE_CXX_FLAGS' is set at /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/CMakeLists.txt: shown below: Call Stack (most recent call first): /usr/share/cmake/Modules/CheckSymbolExists.cmake:9223372036854775807 (rocm_check_toolchain_var) /usr/share/cmake/Modules/CheckSymbolExists.cmake:88 (string) /usr/share/cmake/Modules/CheckSymbolExists.cmake:71 (__CHECK_SYMBOL_EXISTS_FILTER_FLAGS) CMakeLists.txt:155 (check_symbol_exists) *-----------------------------------------------------------------------------* ******************************************************************************* -- Looking for hipDeviceMallocUncached -- Looking for hipDeviceMallocUncached - found ******************************************************************************* *------------------------------- ROCMChecks WARNING --------------------------* Options and properties should be set on a cmake target where possible. The variable 'CMAKE_CXX_FLAGS' may be set by the cmake toolchain, either by calling 'cmake -DCMAKE_CXX_FLAGS="-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer"' or set in a toolchain file and added with 'cmake -DCMAKE_TOOLCHAIN_FILE='. ROCMChecks now calling: CMake Warning at /usr/share/rocmcmakebuildtools/cmake/ROCMChecks.cmake:46 (message): 'CMAKE_CXX_FLAGS' is set at /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/CMakeLists.txt: shown below: Call Stack (most recent call first): /usr/share/cmake/Modules/CheckSymbolExists.cmake:9223372036854775807 (rocm_check_toolchain_var) /usr/share/cmake/Modules/CheckSymbolExists.cmake:99 (set) /usr/share/cmake/Modules/CheckSymbolExists.cmake:73 (__CHECK_SYMBOL_EXISTS_RESTORE_FLAGS) CMakeLists.txt:155 (check_symbol_exists) *-----------------------------------------------------------------------------* ******************************************************************************* -- Looking for hipDeviceMallocContiguous ******************************************************************************* *------------------------------- ROCMChecks WARNING --------------------------* Options and properties should be set on a cmake target where possible. The variable 'CMAKE_CXX_FLAGS' may be set by the cmake toolchain, either by calling 'cmake -DCMAKE_CXX_FLAGS="-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer"' or set in a toolchain file and added with 'cmake -DCMAKE_TOOLCHAIN_FILE='. ROCMChecks now calling: CMake Warning at /usr/share/rocmcmakebuildtools/cmake/ROCMChecks.cmake:46 (message): 'CMAKE_CXX_FLAGS' is set at /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/CMakeLists.txt: shown below: Call Stack (most recent call first): /usr/share/cmake/Modules/CheckSymbolExists.cmake:9223372036854775807 (rocm_check_toolchain_var) /usr/share/cmake/Modules/CheckSymbolExists.cmake:87 (string) /usr/share/cmake/Modules/CheckSymbolExists.cmake:71 (__CHECK_SYMBOL_EXISTS_FILTER_FLAGS) CMakeLists.txt:158 (check_symbol_exists) *-----------------------------------------------------------------------------* ******************************************************************************* ******************************************************************************* *------------------------------- ROCMChecks WARNING --------------------------* Options and properties should be set on a cmake target where possible. The variable 'CMAKE_CXX_FLAGS' may be set by the cmake toolchain, either by calling 'cmake -DCMAKE_CXX_FLAGS="-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer"' or set in a toolchain file and added with 'cmake -DCMAKE_TOOLCHAIN_FILE='. ROCMChecks now calling: CMake Warning at /usr/share/rocmcmakebuildtools/cmake/ROCMChecks.cmake:46 (message): 'CMAKE_CXX_FLAGS' is set at /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/CMakeLists.txt: shown below: Call Stack (most recent call first): /usr/share/cmake/Modules/CheckSymbolExists.cmake:9223372036854775807 (rocm_check_toolchain_var) /usr/share/cmake/Modules/CheckSymbolExists.cmake:88 (string) /usr/share/cmake/Modules/CheckSymbolExists.cmake:71 (__CHECK_SYMBOL_EXISTS_FILTER_FLAGS) CMakeLists.txt:158 (check_symbol_exists) *-----------------------------------------------------------------------------* ******************************************************************************* -- Looking for hipDeviceMallocContiguous - found ******************************************************************************* *------------------------------- ROCMChecks WARNING --------------------------* Options and properties should be set on a cmake target where possible. The variable 'CMAKE_CXX_FLAGS' may be set by the cmake toolchain, either by calling 'cmake -DCMAKE_CXX_FLAGS="-O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer"' or set in a toolchain file and added with 'cmake -DCMAKE_TOOLCHAIN_FILE='. ROCMChecks now calling: CMake Warning at /usr/share/rocmcmakebuildtools/cmake/ROCMChecks.cmake:46 (message): 'CMAKE_CXX_FLAGS' is set at /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/CMakeLists.txt: shown below: Call Stack (most recent call first): /usr/share/cmake/Modules/CheckSymbolExists.cmake:9223372036854775807 (rocm_check_toolchain_var) /usr/share/cmake/Modules/CheckSymbolExists.cmake:99 (set) /usr/share/cmake/Modules/CheckSymbolExists.cmake:73 (__CHECK_SYMBOL_EXISTS_RESTORE_FLAGS) CMakeLists.txt:158 (check_symbol_exists) *-----------------------------------------------------------------------------* ******************************************************************************* -- HSA runtime: /usr/include -- Found rocm_smi at /usr/include -- Looking for C++ include /usr/include/rocm_smi/rocm_smi64Config.h -- Looking for C++ include /usr/include/rocm_smi/rocm_smi64Config.h - found -- RSMI_INIT_FLAG_THRAD_ONLY_MUTEX supported -- Performing Test HAVE_KERNARG_PRELOAD -- Performing Test HAVE_KERNARG_PRELOAD - Success -- Kernarg preloading to SGPR enabled -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/device_table.h -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/device_table.cpp -- Generating /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/host_table.cpp -- HIP_UNCACHED_MEMORY enabled -- RCCL LL128 protocol enabled -- Building shared RCCL library -- rocm-cmake: Set license file to /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/LICENSE.txt. -- Configuring done (32.2s) -- Generating done (0.0s) CMake Warning: Manually-specified variables were not used by the project: CMAKE_CXX_FLAGS_RELEASE CMAKE_C_FLAGS_RELEASE CMAKE_Fortran_FLAGS_RELEASE CMAKE_INSTALL_DO_STRIP CMAKE_VERBOSE_MAKEFILE LIB_SUFFIX SHARE_INSTALL_PREFIX SYSCONF_INSTALL_DIR -- Build files have been written to: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 + /usr/bin/cmake --build redhat-linux-build-gfx9 -j48 --verbose Change Dir: '/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9' Run Build Command(s): /usr/bin/ninja-build -v -j 48 [1/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && /usr/bin/cmake -P /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/cmake/scripts/git_version.cmake -- Updating git_version.cpp [2/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/init_nvtx.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init_nvtx.cc [3/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/device/alltoall_pivot.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h [4/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/device/broadcast.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h [5/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/channel.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc [6/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/register.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/register.cc [7/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/device/reduce.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h [8/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/debug.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/debug.cc [9/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/msccl.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc [10/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/graph/rome_models.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.h [11/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/device/primitives.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h [12/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/graph/rings.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rings.cc [13/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/graph/rings.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rings.h [14/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/graph/trees.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/trees.cc [15/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/archinfo.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/archinfo.h [16/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/device/network/unpack/unpack_defs.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack/unpack_defs.h [17/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/align.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/align.h [18/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/collectives.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc [19/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/device/common_kernel.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common_kernel.h [20/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/device/sendrecv.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h [21/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/graph/topo.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h [22/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/device/reduce_scatter.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h [23/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/group.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/group.cc [24/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/device/all_gather.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h [25/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/device/network/unpack/unpack.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack/unpack.h [26/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/device/op128.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/op128.h [27/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/graph/xml.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h [28/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/alloc.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h [29/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/bootstrap.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/bootstrap.cc [30/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/net.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/net.cc [31/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/device/prims_ll128.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h [32/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/transport.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport.cc [33/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/device/reduce_kernel.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_kernel.h [34/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/device/prims_ll.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h [35/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/graph/connect.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc [36/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/graph/tuning.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc [37/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/device/common.cu -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.cu.cpp [38/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/device/onerank.cu -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/onerank.cu.cpp [39/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/graph/paths.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc [40/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/graph/xml.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.cc [41/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/device/prims_simple.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h [42/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/graph/topo.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc [43/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/device/all_reduce.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h [44/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/device/common.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h [45/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/graph/search.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc [46/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/graph/rome_models.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc [47/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/proxy.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/proxy.cc [48/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/argcheck.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h [49/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/enqueue.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc [50/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/channel.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h [51/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/collectives.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/collectives.h [52/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/cpuset.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/cpuset.h [53/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/bootstrap.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/bootstrap.h [54/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/core.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h [55/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/BfdBacktrace.hpp -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/BfdBacktrace.hpp [56/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/init.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc [57/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/checks.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/checks.h [58/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/debug.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/debug.h [59/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/ibvsymbols.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/ibvsymbols.h [60/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/coll_net.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h [61/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/enqueue.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/enqueue.h [62/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/git_version.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/git_version.h [63/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/group.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/group.h [64/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/net_device.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/net_device.h [65/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/comm.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h [66/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/info.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h [67/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/gdrwrap.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h [68/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/net.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/net.h [69/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/ipcsocket.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/ipcsocket.h [70/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/ibvwrap.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/ibvwrap.h [71/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nccl_common.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nccl_common.h [72/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nccl_tuner.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nccl_tuner.h [73/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/profiler.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/profiler.h [74/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/graph.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h [75/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx_stub.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx_stub.h [76/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/device.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h [77/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx.h [78/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvmlwrap.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvmlwrap.h [79/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/param.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/param.h [80/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/register.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/register.h [81/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/ibvcore.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/ibvcore.h [82/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/p2p.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/p2p.h [83/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/proxy.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/proxy.h [84/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/rocm_smi_wrap.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rocm_smi_wrap.h [85/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/shm.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/shm.h [86/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/rocmwrap.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rocmwrap.h [87/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/rccl_vars.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_vars.h [88/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/roctx.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/roctx.h [89/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/signals.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/signals.h [90/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/socket.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/socket.h [91/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nccl_net.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nccl_net.h [92/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/strongstream.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/strongstream.h [93/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/timer.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/timer.h [94/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/rccl_float8.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h [95/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/transport.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h [96/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/trees.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/trees.h [97/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/tuner.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/tuner.h [98/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/msccl/msccl_lifecycle.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_lifecycle.h [99/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/msccl/msccl_parser.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h [100/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/msccl/msccl_scheduler.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_scheduler.h [101/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/msccl/msccl_setup.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_setup.h [102/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/npkit && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/npkit/npkit_struct.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/npkit/npkit_struct.h [103/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/msccl/msccl_status.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_status.h [104/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/npkit && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/npkit/npkit.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/npkit/npkit.h [105/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/utils.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h [106/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx3/nvToolsExtOpenCL.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvToolsExtOpenCL.h [107/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/npkit && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/npkit/npkit_event.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/npkit/npkit_event.h [108/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/msccl/msccl_struct.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_struct.h [109/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx3/nvtxDetail/nvtxImplCudaRt_v3.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCudaRt_v3.h [110/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx3/nvToolsExtCuda.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvToolsExtCuda.h [111/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx3/nvToolsExtCudaRt.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvToolsExtCudaRt.h [112/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx3/nvtxDetail/nvtxImplCuda_v3.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCuda_v3.h [113/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx3/nvtxDetail/nvtxImplSync_v3.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxDetail/nvtxImplSync_v3.h [114/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx3/nvtxDetail/nvtxImplOpenCL_v3.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxDetail/nvtxImplOpenCL_v3.h [115/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx3/nvToolsExtSync.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvToolsExtSync.h [116/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx3/nvtxDetail/nvtxImplCore.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxDetail/nvtxImplCore.h [117/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx3/nvtxDetail/nvtxLinkOnce.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxDetail/nvtxLinkOnce.h [118/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxExtDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx3/nvtxExtDetail/nvtxExtImpl.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtImpl.h [119/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx3/nvtxDetail/nvtxInit.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxDetail/nvtxInit.h [120/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx3/nvtxDetail/nvtxInitDecls.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxDetail/nvtxInitDecls.h [121/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxExtDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx3/nvtxExtDetail/nvtxExtImplPayload_v1.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtImplPayload_v1.h [122/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxExtDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx3/nvtxExtDetail/nvtxExtTypes.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtTypes.h [123/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx3/nvToolsExtPayload.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvToolsExtPayload.h [124/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/alt_rsmi.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alt_rsmi.h [125/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxExtDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx3/nvtxExtDetail/nvtxExtPayloadTypeInfo.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtPayloadTypeInfo.h [126/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx3/nvtxDetail/nvtxImpl.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxDetail/nvtxImpl.h [127/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/misc/npkit.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/npkit.cc [128/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/misc/nvmlwrap_stub.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/nvmlwrap_stub.cc [129/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx3/nvtxDetail/nvtxTypes.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxDetail/nvtxTypes.h [130/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/misc/ibvsymbols.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ibvsymbols.cc [131/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxExtDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx3/nvtxExtDetail/nvtxExtInit.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxExtDetail/nvtxExtInit.h [132/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/misc/ipcsocket.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ipcsocket.cc [133/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxDetail && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx3/nvtxDetail/nvtxInitDefs.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtxDetail/nvtxInitDefs.h [134/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx3/nvToolsExt.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvToolsExt.h [135/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/misc/rocmwrap.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/rocmwrap.cc [136/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/misc/ibvwrap.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ibvwrap.cc [137/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/misc/archinfo.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/archinfo.cc [138/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/misc/argcheck.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/argcheck.cc [139/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/misc/alt_rsmi.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc [140/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/misc/param.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/param.cc [141/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/misc/profiler.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/profiler.cc [142/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/misc/rocm_smi_wrap.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/rocm_smi_wrap.cc [143/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/misc/roctx.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/roctx.cc [144/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/misc/tuner.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/tuner.cc [145/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/misc/shmutils.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/shmutils.cc [146/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/misc/signals.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/signals.cc [147/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/misc/strongstream.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/strongstream.cc [148/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/misc/socket.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/socket.cc [149/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/transport/net_socket.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_socket.cc [150/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3 && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/nvtx3/nvtx3.hpp -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp [151/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/transport/shm.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/shm.cc [152/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/misc/msccl/msccl_lifecycle.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc [153/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/include/msccl/msccl_kernel.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_kernel.h [154/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/transport/coll_net.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc [155/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/misc/msccl/msccl_parser.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc [156/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/misc/msccl/msccl_status.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_status.cc [157/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/misc/utils.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/utils.cc [158/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/misc/msccl/msccl_setup.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc [159/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/device/msccl_kernel_impl.h -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h [160/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/transport/nvls.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/nvls.cc [161/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/transport/p2p.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/p2p.cc [162/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/transport/net_ib.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_ib.cc [163/356] cd /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9 && mkdir -p /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport && /usr/bin/hipify-perl -quiet-warnings /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/src/transport/net.cc -o /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc [164/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/archinfo.cc [165/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/trees.cc [166/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/tuner.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/tuner.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/tuner.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/tuner.cc [167/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/nvmlwrap_stub.cc [168/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ipcsocket.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ipcsocket.cc:8: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. [169/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ibvsymbols.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ibvsymbols.cc:67: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. [170/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/strongstream.cc [171/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/param.cc [172/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/rocmwrap.cc [173/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rings.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rings.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. [174/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/signals.cc [175/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/utils.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/utils.cc:7: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. [176/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/debug.cc.o -MF CMakeFiles/rccl.dir/hipify/src/debug.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/debug.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/debug.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/debug.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. [177/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ibvwrap.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/ibvwrap.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/ibvwrap.h:21: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. [178/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/profiler.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/proxy.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/proxy.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/proxy.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/proxy.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/proxy.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/proxy.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/proxy.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/profiler.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/profiler.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/proxy.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. [179/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/argcheck.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/argcheck.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. [180/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/shmutils.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/shmutils.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. [181/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/register.cc.o -MF CMakeFiles/rccl.dir/hipify/src/register.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/register.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/register.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/register.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. [182/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/init_nvtx.cc.o -MF CMakeFiles/rccl.dir/hipify/src/init_nvtx.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/init_nvtx.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init_nvtx.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx.h:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx.h:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx.h:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx.h:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx.h:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx.h:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ 4 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx.h:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init_nvtx.cc:2: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init_nvtx.cc:4:42: warning: unused variable 'NvtxEnumRedSchema' [-Wunused-const-variable] 4 | static constexpr const nvtxPayloadEnum_t NvtxEnumRedSchema[] = { | ^~~~~~~~~~~~~~~~~ 4 warnings generated when compiling for host. [183/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 339 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 340 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 341 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:342:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 342 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:345:9: warning: unused variable 'ppn' [-Wunused-variable] 345 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:11: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:629:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 629 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 339 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 340 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 341 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:342:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 342 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:345:9: warning: unused variable 'ppn' [-Wunused-variable] 345 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:11: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:629:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 629 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 339 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 340 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 341 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:342:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 342 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:345:9: warning: unused variable 'ppn' [-Wunused-variable] 345 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:11: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:629:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 629 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 339 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 340 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 341 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:342:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 342 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:345:9: warning: unused variable 'ppn' [-Wunused-variable] 345 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:11: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:629:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 629 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 339 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 340 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 341 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:342:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 342 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:345:9: warning: unused variable 'ppn' [-Wunused-variable] 345 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:11: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:629:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 629 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 339 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 340 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 341 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:342:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 342 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:345:9: warning: unused variable 'ppn' [-Wunused-variable] 345 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:11: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:629:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 629 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:339:10: warning: unused variable 'llMaxBw' [-Wunused-variable] 339 | double llMaxBw = llMaxBws[index1][index2]; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:340:10: warning: unused variable 'perChMaxTreeBw' [-Wunused-variable] 340 | double perChMaxTreeBw = perChMaxTreeBws[compCapIndex][index2]; | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:341:10: warning: unused variable 'perChMaxRingLL128Bw' [-Wunused-variable] 341 | double perChMaxRingLL128Bw = perChMaxRingLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:342:10: warning: unused variable 'perChMaxTreeLL128Bw' [-Wunused-variable] 342 | double perChMaxTreeLL128Bw = perChMaxTreeLL128Bws[compCapIndex][index2]; | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:345:9: warning: unused variable 'ppn' [-Wunused-variable] 345 | float ppn = (float)nRanks / nNodes; // if ppn < 2, then we are sending/receiving at the same GPU through the NIC, apply some bw discount | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:11: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/tuning.cc:629:14: warning: unused variable 'treeCorrectionFactor' [-Wunused-variable] 629 | static float treeCorrectionFactor[NCCL_NUM_PROTOCOLS][23] = { | ^~~~~~~~~~~~~~~~~~~~ 14 warnings generated when compiling for host. [184/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/net.cc.o -MF CMakeFiles/rccl.dir/hipify/src/net.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/net.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/net.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. [185/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.cc:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.cc:16: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 7 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.cc:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.cc:16: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 7 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.cc:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.cc:16: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 7 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.cc:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.cc:16: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 7 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.cc:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.cc:16: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 7 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.cc:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.cc:16: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 7 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.cc:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.cc:16: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 7 warnings generated when compiling for host. [186/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o -MF CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/bootstrap.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/bootstrap.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/bootstrap.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/bootstrap.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/bootstrap.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/bootstrap.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/bootstrap.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/bootstrap.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/bootstrap.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/bootstrap.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/bootstrap.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/bootstrap.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/bootstrap.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/bootstrap.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/bootstrap.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/bootstrap.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. [187/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. [188/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/rocm_smi_wrap.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/rocm_smi_wrap.cc:24: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 1 warning generated when compiling for host. [189/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1031:7: warning: unused variable 'nChannels' [-Wunused-variable] 1031 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1041:12: warning: unused variable 'y' [-Wunused-variable] 1041 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1496:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1496 | static char ringRemap[64]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1500:7: warning: unused variable 'ncpus' [-Wunused-variable] 1500 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1590:9: warning: unused variable 't' [-Wunused-variable] 1590 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1691 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1664:7: note: declared here 1664 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1691 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1664:7: note: declared here 1664 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1661:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1661 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1682:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1682 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1757:9: warning: unused variable 't' [-Wunused-variable] 1757 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:15: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1815 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:15: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1798:7: note: declared here 1798 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:31: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1815 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:31: note: read of non-const variable 'nnets' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1799:7: note: declared here 1799 | int nnets = system->nodes[NET].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1796:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1796 | static char ringRemap[256]; | ^~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:22: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:24: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:25: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 36 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1031:7: warning: unused variable 'nChannels' [-Wunused-variable] 1031 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1041:12: warning: unused variable 'y' [-Wunused-variable] 1041 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1496:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1496 | static char ringRemap[64]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1500:7: warning: unused variable 'ncpus' [-Wunused-variable] 1500 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1590:9: warning: unused variable 't' [-Wunused-variable] 1590 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1691 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1664:7: note: declared here 1664 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1691 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1664:7: note: declared here 1664 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1661:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1661 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1682:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1682 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1757:9: warning: unused variable 't' [-Wunused-variable] 1757 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:15: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1815 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:15: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1798:7: note: declared here 1798 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:31: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1815 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:31: note: read of non-const variable 'nnets' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1799:7: note: declared here 1799 | int nnets = system->nodes[NET].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1796:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1796 | static char ringRemap[256]; | ^~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:22: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:24: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:25: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 36 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1031:7: warning: unused variable 'nChannels' [-Wunused-variable] 1031 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1041:12: warning: unused variable 'y' [-Wunused-variable] 1041 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1496:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1496 | static char ringRemap[64]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1500:7: warning: unused variable 'ncpus' [-Wunused-variable] 1500 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1590:9: warning: unused variable 't' [-Wunused-variable] 1590 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1691 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1664:7: note: declared here 1664 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1691 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1664:7: note: declared here 1664 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1661:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1661 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1682:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1682 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1757:9: warning: unused variable 't' [-Wunused-variable] 1757 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:15: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1815 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:15: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1798:7: note: declared here 1798 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:31: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1815 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:31: note: read of non-const variable 'nnets' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1799:7: note: declared here 1799 | int nnets = system->nodes[NET].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1796:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1796 | static char ringRemap[256]; | ^~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:22: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:24: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:25: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 36 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1031:7: warning: unused variable 'nChannels' [-Wunused-variable] 1031 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1041:12: warning: unused variable 'y' [-Wunused-variable] 1041 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1496:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1496 | static char ringRemap[64]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1500:7: warning: unused variable 'ncpus' [-Wunused-variable] 1500 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1590:9: warning: unused variable 't' [-Wunused-variable] 1590 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1691 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1664:7: note: declared here 1664 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1691 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1664:7: note: declared here 1664 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1661:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1661 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1682:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1682 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1757:9: warning: unused variable 't' [-Wunused-variable] 1757 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:15: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1815 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:15: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1798:7: note: declared here 1798 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:31: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1815 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:31: note: read of non-const variable 'nnets' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1799:7: note: declared here 1799 | int nnets = system->nodes[NET].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1796:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1796 | static char ringRemap[256]; | ^~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:22: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:24: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:25: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 36 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1031:7: warning: unused variable 'nChannels' [-Wunused-variable] 1031 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1041:12: warning: unused variable 'y' [-Wunused-variable] 1041 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1496:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1496 | static char ringRemap[64]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1500:7: warning: unused variable 'ncpus' [-Wunused-variable] 1500 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1590:9: warning: unused variable 't' [-Wunused-variable] 1590 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1691 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1664:7: note: declared here 1664 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1691 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1664:7: note: declared here 1664 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1661:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1661 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1682:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1682 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1757:9: warning: unused variable 't' [-Wunused-variable] 1757 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:15: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1815 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:15: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1798:7: note: declared here 1798 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:31: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1815 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:31: note: read of non-const variable 'nnets' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1799:7: note: declared here 1799 | int nnets = system->nodes[NET].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1796:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1796 | static char ringRemap[256]; | ^~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:22: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:24: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:25: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 36 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1031:7: warning: unused variable 'nChannels' [-Wunused-variable] 1031 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1041:12: warning: unused variable 'y' [-Wunused-variable] 1041 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1496:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1496 | static char ringRemap[64]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1500:7: warning: unused variable 'ncpus' [-Wunused-variable] 1500 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1590:9: warning: unused variable 't' [-Wunused-variable] 1590 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1691 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1664:7: note: declared here 1664 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1691 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1664:7: note: declared here 1664 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1661:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1661 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1682:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1682 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1757:9: warning: unused variable 't' [-Wunused-variable] 1757 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:15: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1815 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:15: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1798:7: note: declared here 1798 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:31: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1815 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:31: note: read of non-const variable 'nnets' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1799:7: note: declared here 1799 | int nnets = system->nodes[NET].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1796:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1796 | static char ringRemap[256]; | ^~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:22: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:24: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:25: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 36 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:23: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1031:7: warning: unused variable 'nChannels' [-Wunused-variable] 1031 | int nChannels = 0; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1041:12: warning: unused variable 'y' [-Wunused-variable] 1041 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1496:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1496 | static char ringRemap[64]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1500:7: warning: unused variable 'ncpus' [-Wunused-variable] 1500 | int ncpus = system->nodes[CPU].count; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1590:9: warning: unused variable 't' [-Wunused-variable] 1590 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:14: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1691 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:14: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1664:7: note: declared here 1664 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:24: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1691 | int j, r[ngpus], g[ngpus]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1691:24: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1664:7: note: declared here 1664 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1661:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1661 | static char ringRemap[256]; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1682:7: warning: variable 'gcnt' set but not used [-Wunused-but-set-variable] 1682 | int gcnt = 0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1757:9: warning: unused variable 't' [-Wunused-variable] 1757 | float t = (tve.tv_sec - tvs.tv_sec)*1E3 + (tve.tv_usec - tvs.tv_usec)/1E3; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:15: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1815 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:15: note: read of non-const variable 'ngpus' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1798:7: note: declared here 1798 | int ngpus = system->nodes[GPU].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:31: warning: variable length arrays in C++ are a Clang extension [-Wvla-cxx-extension] 1815 | int g_hives[ngpus], n_hives[nnets]; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1815:31: note: read of non-const variable 'nnets' is not allowed in a constant expression /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1799:7: note: declared here 1799 | int nnets = system->nodes[NET].count; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:1796:15: warning: unused variable 'ringRemap' [-Wunused-variable] 1796 | static char ringRemap[256]; | ^~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:22: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:24: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/rome_models.cc:25: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 36 warnings generated when compiling for host. [190/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/roctx.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/roctx.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/roctx.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/roctx.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/roctx.h:17: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 3 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/roctx.h:17: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 3 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/roctx.h:17: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 3 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/roctx.h:17: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 3 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/roctx.h:17: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 3 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/roctx.h:17: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 3 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/roctx.h:17: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1940:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1940 | 0, // payload value (union) | ^ | {} /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/nvtx3/nvtx3.hpp:1942:9: warning: suggest braces around initialization of subobject [-Wmissing-braces] 1942 | 0 // message value (union) | ^ | {} In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/roctx.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/roctx.h:18: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 3 warnings generated when compiling for host. [191/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:11: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:11: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:11: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:11: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:11: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:11: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/search.cc:11: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ 14 warnings generated when compiling for host. [192/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:17: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 24 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:17: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 24 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:17: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 24 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:17: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 24 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:17: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 24 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:17: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 24 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.cc:17: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 24 warnings generated when compiling for host. [193/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/proxy.cc.o -MF CMakeFiles/rccl.dir/hipify/src/proxy.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/proxy.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/proxy.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/proxy.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. [194/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 4 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 4 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 4 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 4 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 4 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 4 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:16: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:711:16: warning: unused variable 'ret' [-Wunused-variable] 711 | ncclResult_t ret = ncclSuccess; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:723:16: warning: unused variable 'ret' [-Wunused-variable] 723 | ncclResult_t ret = ncclSuccess; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_parser.cc:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 4 warnings generated when compiling for host. [195/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/socket.cc /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/socket.cc:598:8: warning: unused variable 'line' [-Wunused-variable] 598 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/socket.cc:8: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx900. /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/socket.cc:598:8: warning: unused variable 'line' [-Wunused-variable] 598 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/socket.cc:8: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx906. /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/socket.cc:598:8: warning: unused variable 'line' [-Wunused-variable] 598 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/socket.cc:8: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx908. /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/socket.cc:598:8: warning: unused variable 'line' [-Wunused-variable] 598 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/socket.cc:8: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/socket.cc:598:8: warning: unused variable 'line' [-Wunused-variable] 598 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/socket.cc:8: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/socket.cc:598:8: warning: unused variable 'line' [-Wunused-variable] 598 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/socket.cc:8: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx942. /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/socket.cc:598:8: warning: unused variable 'line' [-Wunused-variable] 598 | char line[SOCKET_NAME_MAXLEN+1]; | ^~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/socket.cc:8: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. [196/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_status.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_status.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_status.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_struct.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for host. [197/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/collectives.cc.o -MF CMakeFiles/rccl.dir/hipify/src/collectives.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/collectives.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:20:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 20 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:23:10: warning: unused variable 'msgsize' [-Wunused-variable] 23 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:47:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 47 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:52:23: warning: unused variable 'payload' [-Wunused-variable] 52 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:72:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 72 | constexpr nvtxPayloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:75:10: warning: unused variable 'msgsize' [-Wunused-variable] 75 | size_t msgsize = count * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:118:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 118 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:122:23: warning: unused variable 'payload' [-Wunused-variable] 122 | NvtxParamsAllToAllv payload{sendcounts[comm->rank] * ncclTypeSize(datatype), recvcounts[comm->rank] * ncclTypeSize(datatype)}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:162:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 162 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:166:23: warning: unused variable 'payload' [-Wunused-variable] 166 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:196:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 196 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:200:22: warning: unused variable 'payload' [-Wunused-variable] 200 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:234:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 234 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:240:20: warning: unused variable 'payload' [-Wunused-variable] 240 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:263:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 263 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:268:27: warning: unused variable 'payload' [-Wunused-variable] 268 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:291:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 291 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:295:23: warning: unused variable 'payload' [-Wunused-variable] 295 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:333:22: warning: unused variable 'payload' [-Wunused-variable] 333 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:356:22: warning: unused variable 'payload' [-Wunused-variable] 356 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:324:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 324 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ 30 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:20:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 20 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:23:10: warning: unused variable 'msgsize' [-Wunused-variable] 23 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:47:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 47 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:52:23: warning: unused variable 'payload' [-Wunused-variable] 52 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:72:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 72 | constexpr nvtxPayloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:75:10: warning: unused variable 'msgsize' [-Wunused-variable] 75 | size_t msgsize = count * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:118:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 118 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:122:23: warning: unused variable 'payload' [-Wunused-variable] 122 | NvtxParamsAllToAllv payload{sendcounts[comm->rank] * ncclTypeSize(datatype), recvcounts[comm->rank] * ncclTypeSize(datatype)}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:162:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 162 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:166:23: warning: unused variable 'payload' [-Wunused-variable] 166 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:196:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 196 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:200:22: warning: unused variable 'payload' [-Wunused-variable] 200 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:234:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 234 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:240:20: warning: unused variable 'payload' [-Wunused-variable] 240 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:263:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 263 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:268:27: warning: unused variable 'payload' [-Wunused-variable] 268 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:291:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 291 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:295:23: warning: unused variable 'payload' [-Wunused-variable] 295 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:333:22: warning: unused variable 'payload' [-Wunused-variable] 333 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:356:22: warning: unused variable 'payload' [-Wunused-variable] 356 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:324:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 324 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ 30 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:20:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 20 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:23:10: warning: unused variable 'msgsize' [-Wunused-variable] 23 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:47:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 47 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:52:23: warning: unused variable 'payload' [-Wunused-variable] 52 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:72:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 72 | constexpr nvtxPayloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:75:10: warning: unused variable 'msgsize' [-Wunused-variable] 75 | size_t msgsize = count * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:118:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 118 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:122:23: warning: unused variable 'payload' [-Wunused-variable] 122 | NvtxParamsAllToAllv payload{sendcounts[comm->rank] * ncclTypeSize(datatype), recvcounts[comm->rank] * ncclTypeSize(datatype)}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:162:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 162 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:166:23: warning: unused variable 'payload' [-Wunused-variable] 166 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:196:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 196 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:200:22: warning: unused variable 'payload' [-Wunused-variable] 200 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:234:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 234 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:240:20: warning: unused variable 'payload' [-Wunused-variable] 240 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:263:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 263 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:268:27: warning: unused variable 'payload' [-Wunused-variable] 268 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:291:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 291 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:295:23: warning: unused variable 'payload' [-Wunused-variable] 295 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:333:22: warning: unused variable 'payload' [-Wunused-variable] 333 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:356:22: warning: unused variable 'payload' [-Wunused-variable] 356 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:324:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 324 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ 30 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:20:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 20 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:23:10: warning: unused variable 'msgsize' [-Wunused-variable] 23 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:47:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 47 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:52:23: warning: unused variable 'payload' [-Wunused-variable] 52 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:72:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 72 | constexpr nvtxPayloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:75:10: warning: unused variable 'msgsize' [-Wunused-variable] 75 | size_t msgsize = count * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:118:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 118 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:122:23: warning: unused variable 'payload' [-Wunused-variable] 122 | NvtxParamsAllToAllv payload{sendcounts[comm->rank] * ncclTypeSize(datatype), recvcounts[comm->rank] * ncclTypeSize(datatype)}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:162:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 162 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:166:23: warning: unused variable 'payload' [-Wunused-variable] 166 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:196:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 196 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:200:22: warning: unused variable 'payload' [-Wunused-variable] 200 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:234:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 234 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:240:20: warning: unused variable 'payload' [-Wunused-variable] 240 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:263:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 263 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:268:27: warning: unused variable 'payload' [-Wunused-variable] 268 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:291:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 291 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:295:23: warning: unused variable 'payload' [-Wunused-variable] 295 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:333:22: warning: unused variable 'payload' [-Wunused-variable] 333 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:356:22: warning: unused variable 'payload' [-Wunused-variable] 356 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:324:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 324 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ 30 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:20:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 20 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:23:10: warning: unused variable 'msgsize' [-Wunused-variable] 23 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:47:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 47 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:52:23: warning: unused variable 'payload' [-Wunused-variable] 52 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:72:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 72 | constexpr nvtxPayloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:75:10: warning: unused variable 'msgsize' [-Wunused-variable] 75 | size_t msgsize = count * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:118:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 118 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:122:23: warning: unused variable 'payload' [-Wunused-variable] 122 | NvtxParamsAllToAllv payload{sendcounts[comm->rank] * ncclTypeSize(datatype), recvcounts[comm->rank] * ncclTypeSize(datatype)}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:162:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 162 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:166:23: warning: unused variable 'payload' [-Wunused-variable] 166 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:196:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 196 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:200:22: warning: unused variable 'payload' [-Wunused-variable] 200 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:234:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 234 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:240:20: warning: unused variable 'payload' [-Wunused-variable] 240 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:263:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 263 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:268:27: warning: unused variable 'payload' [-Wunused-variable] 268 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:291:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 291 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:295:23: warning: unused variable 'payload' [-Wunused-variable] 295 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:333:22: warning: unused variable 'payload' [-Wunused-variable] 333 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:356:22: warning: unused variable 'payload' [-Wunused-variable] 356 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:324:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 324 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ 30 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:20:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 20 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:23:10: warning: unused variable 'msgsize' [-Wunused-variable] 23 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:47:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 47 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:52:23: warning: unused variable 'payload' [-Wunused-variable] 52 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:72:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 72 | constexpr nvtxPayloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:75:10: warning: unused variable 'msgsize' [-Wunused-variable] 75 | size_t msgsize = count * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:118:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 118 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:122:23: warning: unused variable 'payload' [-Wunused-variable] 122 | NvtxParamsAllToAllv payload{sendcounts[comm->rank] * ncclTypeSize(datatype), recvcounts[comm->rank] * ncclTypeSize(datatype)}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:162:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 162 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:166:23: warning: unused variable 'payload' [-Wunused-variable] 166 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:196:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 196 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:200:22: warning: unused variable 'payload' [-Wunused-variable] 200 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:234:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 234 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:240:20: warning: unused variable 'payload' [-Wunused-variable] 240 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:263:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 263 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:268:27: warning: unused variable 'payload' [-Wunused-variable] 268 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:291:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 291 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:295:23: warning: unused variable 'payload' [-Wunused-variable] 295 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:333:22: warning: unused variable 'payload' [-Wunused-variable] 333 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:356:22: warning: unused variable 'payload' [-Wunused-variable] 356 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:324:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 324 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ 30 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:20:38: warning: unused variable 'AllGatherSchema' [-Wunused-variable] 20 | constexpr nvtxPayloadSchemaEntry_t AllGatherSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:23:10: warning: unused variable 'msgsize' [-Wunused-variable] 23 | size_t msgsize = sendcount * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:47:45: warning: unused variable 'AllReduceSchema' [-Wunused-variable] 47 | static constexpr nvtxPayloadSchemaEntry_t AllReduceSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:52:23: warning: unused variable 'payload' [-Wunused-variable] 52 | NvtxParamsAllReduce payload{count * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:72:38: warning: unused variable 'AllToAllSchema' [-Wunused-variable] 72 | constexpr nvtxPayloadSchemaEntry_t AllToAllSchema[] = { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:75:10: warning: unused variable 'msgsize' [-Wunused-variable] 75 | size_t msgsize = count * ncclTypeSize(datatype); | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:118:38: warning: unused variable 'AllToAllvSchema' [-Wunused-variable] 118 | constexpr nvtxPayloadSchemaEntry_t AllToAllvSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:122:23: warning: unused variable 'payload' [-Wunused-variable] 122 | NvtxParamsAllToAllv payload{sendcounts[comm->rank] * ncclTypeSize(datatype), recvcounts[comm->rank] * ncclTypeSize(datatype)}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:162:38: warning: unused variable 'BroadcastSchema' [-Wunused-variable] 162 | constexpr nvtxPayloadSchemaEntry_t BroadcastSchema[] = { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:166:23: warning: unused variable 'payload' [-Wunused-variable] 166 | NvtxParamsBroadcast payload{count * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:196:40: warning: unused variable 'GatherSchema' [-Wunused-variable] 196 | constexpr nvtxPayloadSchemaEntry_t GatherSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:200:22: warning: unused variable 'payload' [-Wunused-variable] 200 | NvtxParamsGather payload{sendcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:234:38: warning: unused variable 'ReduceSchema' [-Wunused-variable] 234 | constexpr nvtxPayloadSchemaEntry_t ReduceSchema[] = { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:240:20: warning: unused variable 'payload' [-Wunused-variable] 240 | NvtxParamsReduce payload{count * ncclTypeSize(datatype), root, op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:263:38: warning: unused variable 'ReduceScatterSchema' [-Wunused-variable] 263 | constexpr nvtxPayloadSchemaEntry_t ReduceScatterSchema[] = { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:268:27: warning: unused variable 'payload' [-Wunused-variable] 268 | NvtxParamsReduceScatter payload{recvcount * ncclTypeSize(datatype), op}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:291:40: warning: unused variable 'ScatterSchema' [-Wunused-variable] 291 | constexpr nvtxPayloadSchemaEntry_t ScatterSchema[] = { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:295:23: warning: unused variable 'payload' [-Wunused-variable] 295 | NvtxParamsScatter payload{recvcount * ncclTypeSize(datatype), root}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:333:22: warning: unused variable 'payload' [-Wunused-variable] 333 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:356:22: warning: unused variable 'payload' [-Wunused-variable] 356 | NvtxParamsSendRecv payload{count * ncclTypeSize(datatype), peer}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/argcheck.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/collectives.cc:324:42: warning: unused variable 'SendRecvSchema' [-Wunused-const-variable] 324 | constexpr const nvtxPayloadSchemaEntry_t SendRecvSchema[] = { | ^~~~~~~~~~~~~~ 30 warnings generated when compiling for host. [198/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:119:12: warning: unused variable 'y' [-Wunused-variable] 119 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:126:7: warning: unused variable 'localRanks' [-Wunused-variable] 126 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:260:21: warning: unused function 'getIndexes' [-Wunused-function] 260 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:119:12: warning: unused variable 'y' [-Wunused-variable] 119 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:126:7: warning: unused variable 'localRanks' [-Wunused-variable] 126 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:260:21: warning: unused function 'getIndexes' [-Wunused-function] 260 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:119:12: warning: unused variable 'y' [-Wunused-variable] 119 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:126:7: warning: unused variable 'localRanks' [-Wunused-variable] 126 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:260:21: warning: unused function 'getIndexes' [-Wunused-function] 260 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:119:12: warning: unused variable 'y' [-Wunused-variable] 119 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:126:7: warning: unused variable 'localRanks' [-Wunused-variable] 126 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:260:21: warning: unused function 'getIndexes' [-Wunused-function] 260 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:119:12: warning: unused variable 'y' [-Wunused-variable] 119 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:126:7: warning: unused variable 'localRanks' [-Wunused-variable] 126 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:260:21: warning: unused function 'getIndexes' [-Wunused-function] 260 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:119:12: warning: unused variable 'y' [-Wunused-variable] 119 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:126:7: warning: unused variable 'localRanks' [-Wunused-variable] 126 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:260:21: warning: unused function 'getIndexes' [-Wunused-function] 260 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:119:12: warning: unused variable 'y' [-Wunused-variable] 119 | int x=0, y=0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:126:7: warning: unused variable 'localRanks' [-Wunused-variable] 126 | int localRanks = comm->topo->nodes[GPU].count; | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/connect.cc:260:21: warning: unused function 'getIndexes' [-Wunused-function] 260 | static ncclResult_t getIndexes(int* ranks, int* indexes, int nNodes) { | ^~~~~~~~~~ 11 warnings generated when compiling for host. [199/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/group.cc.o -MF CMakeFiles/rccl.dir/hipify/src/group.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/group.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/group.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/group.cc:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 3 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/group.cc:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 3 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/group.cc:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 3 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/group.cc:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 3 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/group.cc:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 3 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/group.cc:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 3 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/group.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/group.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/group.cc:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 3 warnings generated when compiling for host. [200/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/msccl.cc.o -MF CMakeFiles/rccl.dir/hipify/src/msccl.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/msccl.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:52:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 52 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:56:19: warning: unused variable 'payload' [-Wunused-variable] 56 | NvtxParamsMsccl payload{sendCounts[comm->rank] * ncclTypeSize(dataType), recvCounts[comm->rank] * ncclTypeSize(dataType)}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ 7 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:52:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 52 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:56:19: warning: unused variable 'payload' [-Wunused-variable] 56 | NvtxParamsMsccl payload{sendCounts[comm->rank] * ncclTypeSize(dataType), recvCounts[comm->rank] * ncclTypeSize(dataType)}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ 7 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:52:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 52 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:56:19: warning: unused variable 'payload' [-Wunused-variable] 56 | NvtxParamsMsccl payload{sendCounts[comm->rank] * ncclTypeSize(dataType), recvCounts[comm->rank] * ncclTypeSize(dataType)}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ 7 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:52:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 52 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:56:19: warning: unused variable 'payload' [-Wunused-variable] 56 | NvtxParamsMsccl payload{sendCounts[comm->rank] * ncclTypeSize(dataType), recvCounts[comm->rank] * ncclTypeSize(dataType)}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ 7 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:52:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 52 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:56:19: warning: unused variable 'payload' [-Wunused-variable] 56 | NvtxParamsMsccl payload{sendCounts[comm->rank] * ncclTypeSize(dataType), recvCounts[comm->rank] * ncclTypeSize(dataType)}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ 7 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:52:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 52 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:56:19: warning: unused variable 'payload' [-Wunused-variable] 56 | NvtxParamsMsccl payload{sendCounts[comm->rank] * ncclTypeSize(dataType), recvCounts[comm->rank] * ncclTypeSize(dataType)}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ 7 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:52:38: warning: unused variable 'MscclSchema' [-Wunused-variable] 52 | constexpr nvtxPayloadSchemaEntry_t MscclSchema[] = { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:56:19: warning: unused variable 'payload' [-Wunused-variable] 56 | NvtxParamsMsccl payload{sendCounts[comm->rank] * ncclTypeSize(dataType), recvCounts[comm->rank] * ncclTypeSize(dataType)}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/msccl.cc:7: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ 7 warnings generated when compiling for host. [201/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o -MF CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:270:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 270 | int intermediateIndex = -1; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:457:24: warning: unused variable 'gpu' [-Wunused-variable] 457 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 23 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:270:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 270 | int intermediateIndex = -1; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:457:24: warning: unused variable 'gpu' [-Wunused-variable] 457 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 23 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:270:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 270 | int intermediateIndex = -1; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:457:24: warning: unused variable 'gpu' [-Wunused-variable] 457 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 23 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:270:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 270 | int intermediateIndex = -1; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:457:24: warning: unused variable 'gpu' [-Wunused-variable] 457 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 23 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:270:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 270 | int intermediateIndex = -1; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:457:24: warning: unused variable 'gpu' [-Wunused-variable] 457 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 23 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:270:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 270 | int intermediateIndex = -1; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:457:24: warning: unused variable 'gpu' [-Wunused-variable] 457 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 23 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:270:7: warning: variable 'intermediateIndex' set but not used [-Wunused-but-set-variable] 270 | int intermediateIndex = -1; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:457:24: warning: unused variable 'gpu' [-Wunused-variable] 457 | struct ncclTopoNode* gpu = system->nodes[GPU].nodes+g; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:10: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/paths.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 23 warnings generated when compiling for host. [202/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:72:16: warning: unused variable 'status' [-Wunused-variable] 72 | mscclStatus& status = mscclGetStatus(); | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:128:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 128 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:6: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 5 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:72:16: warning: unused variable 'status' [-Wunused-variable] 72 | mscclStatus& status = mscclGetStatus(); | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:128:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 128 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:6: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 5 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:72:16: warning: unused variable 'status' [-Wunused-variable] 72 | mscclStatus& status = mscclGetStatus(); | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:128:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 128 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:6: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 5 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:72:16: warning: unused variable 'status' [-Wunused-variable] 72 | mscclStatus& status = mscclGetStatus(); | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:128:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 128 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:6: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 5 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:72:16: warning: unused variable 'status' [-Wunused-variable] 72 | mscclStatus& status = mscclGetStatus(); | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:128:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 128 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:6: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 5 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:72:16: warning: unused variable 'status' [-Wunused-variable] 72 | mscclStatus& status = mscclGetStatus(); | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:128:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 128 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:6: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 5 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:72:16: warning: unused variable 'status' [-Wunused-variable] 72 | mscclStatus& status = mscclGetStatus(); | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:128:27: warning: unused variable 'threadLocalStatus' [-Wunused-variable] 128 | mscclThreadLocalStatus& threadLocalStatus = mscclGetThreadLocalStatus(); | ^~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:6: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_setup.cc:6: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ 5 warnings generated when compiling for host. [203/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/npkit.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/npkit.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/npkit.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/npkit.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/npkit.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/npkit.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/npkit.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/npkit.cc:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/npkit/npkit.h:16: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/npkit.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. [204/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/alt_rsmi.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/alt_rsmi.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/alt_rsmi.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:103:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 103 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:101:13: warning: unused variable 'ret_domain' [-Wunused-variable] 101 | int ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:232:22: warning: unused variable 'hops' [-Wunused-variable] 232 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:68:14: warning: unused variable 'count' [-Wunused-variable] 68 | uint32_t count = 0; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:50:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 50 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:537:13: warning: unused function 'fileExists' [-Wunused-function] 537 | static bool fileExists(char const *filename) | ^~~~~~~~~~ 6 warnings generated when compiling for gfx900. /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:103:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 103 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:101:13: warning: unused variable 'ret_domain' [-Wunused-variable] 101 | int ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:232:22: warning: unused variable 'hops' [-Wunused-variable] 232 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:68:14: warning: unused variable 'count' [-Wunused-variable] 68 | uint32_t count = 0; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:50:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 50 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:537:13: warning: unused function 'fileExists' [-Wunused-function] 537 | static bool fileExists(char const *filename) | ^~~~~~~~~~ 6 warnings generated when compiling for gfx906. /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:103:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 103 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:101:13: warning: unused variable 'ret_domain' [-Wunused-variable] 101 | int ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:232:22: warning: unused variable 'hops' [-Wunused-variable] 232 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:68:14: warning: unused variable 'count' [-Wunused-variable] 68 | uint32_t count = 0; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:50:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 50 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:537:13: warning: unused function 'fileExists' [-Wunused-function] 537 | static bool fileExists(char const *filename) | ^~~~~~~~~~ 6 warnings generated when compiling for gfx908. /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:103:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 103 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:101:13: warning: unused variable 'ret_domain' [-Wunused-variable] 101 | int ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:232:22: warning: unused variable 'hops' [-Wunused-variable] 232 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:68:14: warning: unused variable 'count' [-Wunused-variable] 68 | uint32_t count = 0; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:50:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 50 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:537:13: warning: unused function 'fileExists' [-Wunused-function] 537 | static bool fileExists(char const *filename) | ^~~~~~~~~~ 6 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:103:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 103 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:101:13: warning: unused variable 'ret_domain' [-Wunused-variable] 101 | int ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:232:22: warning: unused variable 'hops' [-Wunused-variable] 232 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:68:14: warning: unused variable 'count' [-Wunused-variable] 68 | uint32_t count = 0; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:50:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 50 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:537:13: warning: unused function 'fileExists' [-Wunused-function] 537 | static bool fileExists(char const *filename) | ^~~~~~~~~~ 6 warnings generated when compiling for gfx90a. /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:103:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 103 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:101:13: warning: unused variable 'ret_domain' [-Wunused-variable] 101 | int ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:232:22: warning: unused variable 'hops' [-Wunused-variable] 232 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:68:14: warning: unused variable 'count' [-Wunused-variable] 68 | uint32_t count = 0; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:50:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 50 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:537:13: warning: unused function 'fileExists' [-Wunused-function] 537 | static bool fileExists(char const *filename) | ^~~~~~~~~~ 6 warnings generated when compiling for gfx942. /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:103:33: warning: bitwise negation of a boolean expression always evaluates to 'true'; did you mean logical negation? [-Wbool-operation] 103 | if (ret_gpu_id == 0 && ~(ret_unique_id != 0 || ret_loc_id != 0 || ret_unique_id != 0 || ret_vendor != 0) && | ^~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ! /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:101:13: warning: unused variable 'ret_domain' [-Wunused-variable] 101 | int ret_domain = read_node_properties(node_id, "domain", &domain, properties); | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:232:22: warning: unused variable 'hops' [-Wunused-variable] 232 | uint64_t hops; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:68:14: warning: unused variable 'count' [-Wunused-variable] 68 | uint32_t count = 0; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:50:20: warning: unused variable 'kPathDRMRoot' [-Wunused-variable] 50 | static const char *kPathDRMRoot = "/sys/class/drm"; | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/alt_rsmi.cc:537:13: warning: unused function 'fileExists' [-Wunused-function] 537 | static bool fileExists(char const *filename) | ^~~~~~~~~~ 6 warnings generated when compiling for host. [205/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/channel.cc.o -MF CMakeFiles/rccl.dir/hipify/src/channel.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/channel.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:7: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:7: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:7: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:7: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:7: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:7: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:7: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:41:21: warning: unused function 'ncclChannelCompute' [-Wunused-function] 41 | static ncclResult_t ncclChannelCompute(struct ncclComm* comm, int peer, int channelInc, int coll, int*channelId) { | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/channel.cc:9: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ 9 warnings generated when compiling for host. [206/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:9: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:196:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 196 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:399:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 399 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ 23 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:9: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:196:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 196 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:399:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 399 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ 23 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:9: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:196:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 196 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:399:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 399 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ 23 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:9: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:196:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 196 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:399:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 399 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ 23 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:9: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:196:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 196 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:399:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 399 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ 23 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:9: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:196:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 196 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:399:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 399 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ 23 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:9: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:196:21: warning: unused function 'collNetDumpMap' [-Wunused-function] 196 | static ncclResult_t collNetDumpMap(struct connectMap* map) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/coll_net.cc:399:21: warning: unused function 'sharedBuffersGet' [-Wunused-function] 399 | static ncclResult_t sharedBuffersGet(struct ncclCollNetSharedRes* collNet, int type, int slot, int channel, int* offset) { | ^~~~~~~~~~~~~~~~ 23 warnings generated when compiling for host. [207/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o -MF CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:18: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:27:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 27 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ 13 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:18: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:27:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 27 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ 13 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:18: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:27:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 27 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ 13 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:18: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:27:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 27 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ 13 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:18: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:27:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 27 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ 13 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:18: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:27:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 27 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ 13 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:18: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:16: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:18: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:21: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:75:21: warning: unused function 'mscclXmlGetAttrInt' [-Wunused-function] 75 | static ncclResult_t mscclXmlGetAttrInt(struct mscclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:82:21: warning: unused function 'mscclXmlGetAttrInt64' [-Wunused-function] 82 | static ncclResult_t mscclXmlGetAttrInt64(struct mscclXmlNode* node, const char* attrName, int64_t* value) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/msccl/msccl_parser.h:89:21: warning: unused function 'mscclXmlFindTag' [-Wunused-function] 89 | static ncclResult_t mscclXmlFindTag(struct mscclXml* xml, const char* tagName, struct mscclXmlNode** node) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/misc/msccl/msccl_lifecycle.cc:27:20: warning: unused variable 'mscclAlgoFilePathEnv' [-Wunused-variable] 27 | static const char* mscclAlgoFilePathEnv = "MSCCL_ALGO_FILE_PATH"; | ^~~~~~~~~~~~~~~~~~~~ 13 warnings generated when compiling for host. [208/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o -MF CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:81:5: warning: unused label 'ignore0' [-Wunused-label] 81 | ignore0:; | ^~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:380:7: warning: variable 'rnChannels' set but not used [-Wunused-but-set-variable] 380 | int rnChannels = 0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:487:7: warning: variable 'rnChannel' set but not used [-Wunused-but-set-variable] 487 | int rnChannel = 0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:591:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 591 | struct ncclWorkElemP2p elem = {0}; | ^ | {} In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:11: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:43:21: warning: unused function 'computeColl' [-Wunused-function] 43 | static ncclResult_t computeColl(struct ncclInfo* info /* input */, int* workFuncIndex, struct ncclWorkElem* work, struct ncclProxyOp* proxyOp /* output */); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:57:21: warning: unused function 'getLoopInfo' [-Wunused-function] 57 | static ncclResult_t getLoopInfo(struct ncclInfo* collInfo); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:745:21: warning: unused function 'getCBDCollnChannel' [-Wunused-function] 745 | static ncclResult_t getCBDCollnChannel(struct ncclKernelPlan* plan, struct ncclInfo* collInfo, int usableChannels) { | ^~~~~~~~~~~~~~~~~~ 36 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:81:5: warning: unused label 'ignore0' [-Wunused-label] 81 | ignore0:; | ^~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:380:7: warning: variable 'rnChannels' set but not used [-Wunused-but-set-variable] 380 | int rnChannels = 0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:487:7: warning: variable 'rnChannel' set but not used [-Wunused-but-set-variable] 487 | int rnChannel = 0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:591:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 591 | struct ncclWorkElemP2p elem = {0}; | ^ | {} In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:11: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:43:21: warning: unused function 'computeColl' [-Wunused-function] 43 | static ncclResult_t computeColl(struct ncclInfo* info /* input */, int* workFuncIndex, struct ncclWorkElem* work, struct ncclProxyOp* proxyOp /* output */); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:57:21: warning: unused function 'getLoopInfo' [-Wunused-function] 57 | static ncclResult_t getLoopInfo(struct ncclInfo* collInfo); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:745:21: warning: unused function 'getCBDCollnChannel' [-Wunused-function] 745 | static ncclResult_t getCBDCollnChannel(struct ncclKernelPlan* plan, struct ncclInfo* collInfo, int usableChannels) { | ^~~~~~~~~~~~~~~~~~ 36 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:81:5: warning: unused label 'ignore0' [-Wunused-label] 81 | ignore0:; | ^~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:380:7: warning: variable 'rnChannels' set but not used [-Wunused-but-set-variable] 380 | int rnChannels = 0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:487:7: warning: variable 'rnChannel' set but not used [-Wunused-but-set-variable] 487 | int rnChannel = 0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:591:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 591 | struct ncclWorkElemP2p elem = {0}; | ^ | {} In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:11: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:43:21: warning: unused function 'computeColl' [-Wunused-function] 43 | static ncclResult_t computeColl(struct ncclInfo* info /* input */, int* workFuncIndex, struct ncclWorkElem* work, struct ncclProxyOp* proxyOp /* output */); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:57:21: warning: unused function 'getLoopInfo' [-Wunused-function] 57 | static ncclResult_t getLoopInfo(struct ncclInfo* collInfo); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:745:21: warning: unused function 'getCBDCollnChannel' [-Wunused-function] 745 | static ncclResult_t getCBDCollnChannel(struct ncclKernelPlan* plan, struct ncclInfo* collInfo, int usableChannels) { | ^~~~~~~~~~~~~~~~~~ 36 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:81:5: warning: unused label 'ignore0' [-Wunused-label] 81 | ignore0:; | ^~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:380:7: warning: variable 'rnChannels' set but not used [-Wunused-but-set-variable] 380 | int rnChannels = 0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:487:7: warning: variable 'rnChannel' set but not used [-Wunused-but-set-variable] 487 | int rnChannel = 0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:591:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 591 | struct ncclWorkElemP2p elem = {0}; | ^ | {} In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:11: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:43:21: warning: unused function 'computeColl' [-Wunused-function] 43 | static ncclResult_t computeColl(struct ncclInfo* info /* input */, int* workFuncIndex, struct ncclWorkElem* work, struct ncclProxyOp* proxyOp /* output */); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:57:21: warning: unused function 'getLoopInfo' [-Wunused-function] 57 | static ncclResult_t getLoopInfo(struct ncclInfo* collInfo); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:745:21: warning: unused function 'getCBDCollnChannel' [-Wunused-function] 745 | static ncclResult_t getCBDCollnChannel(struct ncclKernelPlan* plan, struct ncclInfo* collInfo, int usableChannels) { | ^~~~~~~~~~~~~~~~~~ 36 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:81:5: warning: unused label 'ignore0' [-Wunused-label] 81 | ignore0:; | ^~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:380:7: warning: variable 'rnChannels' set but not used [-Wunused-but-set-variable] 380 | int rnChannels = 0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:487:7: warning: variable 'rnChannel' set but not used [-Wunused-but-set-variable] 487 | int rnChannel = 0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:591:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 591 | struct ncclWorkElemP2p elem = {0}; | ^ | {} In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:11: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:43:21: warning: unused function 'computeColl' [-Wunused-function] 43 | static ncclResult_t computeColl(struct ncclInfo* info /* input */, int* workFuncIndex, struct ncclWorkElem* work, struct ncclProxyOp* proxyOp /* output */); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:57:21: warning: unused function 'getLoopInfo' [-Wunused-function] 57 | static ncclResult_t getLoopInfo(struct ncclInfo* collInfo); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:745:21: warning: unused function 'getCBDCollnChannel' [-Wunused-function] 745 | static ncclResult_t getCBDCollnChannel(struct ncclKernelPlan* plan, struct ncclInfo* collInfo, int usableChannels) { | ^~~~~~~~~~~~~~~~~~ 36 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:81:5: warning: unused label 'ignore0' [-Wunused-label] 81 | ignore0:; | ^~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:380:7: warning: variable 'rnChannels' set but not used [-Wunused-but-set-variable] 380 | int rnChannels = 0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:487:7: warning: variable 'rnChannel' set but not used [-Wunused-but-set-variable] 487 | int rnChannel = 0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:591:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 591 | struct ncclWorkElemP2p elem = {0}; | ^ | {} In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:11: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:43:21: warning: unused function 'computeColl' [-Wunused-function] 43 | static ncclResult_t computeColl(struct ncclInfo* info /* input */, int* workFuncIndex, struct ncclWorkElem* work, struct ncclProxyOp* proxyOp /* output */); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:57:21: warning: unused function 'getLoopInfo' [-Wunused-function] 57 | static ncclResult_t getLoopInfo(struct ncclInfo* collInfo); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:745:21: warning: unused function 'getCBDCollnChannel' [-Wunused-function] 745 | static ncclResult_t getCBDCollnChannel(struct ncclKernelPlan* plan, struct ncclInfo* collInfo, int usableChannels) { | ^~~~~~~~~~~~~~~~~~ 36 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/enqueue.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:81:5: warning: unused label 'ignore0' [-Wunused-label] 81 | ignore0:; | ^~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:380:7: warning: variable 'rnChannels' set but not used [-Wunused-but-set-variable] 380 | int rnChannels = 0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:487:7: warning: variable 'rnChannel' set but not used [-Wunused-but-set-variable] 487 | int rnChannel = 0; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:591:34: warning: suggest braces around initialization of subobject [-Wmissing-braces] 591 | struct ncclWorkElemP2p elem = {0}; | ^ | {} In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:11: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:21:21: warning: unused function 'collNetReduceSupport' [-Wunused-function] 21 | static ncclResult_t collNetReduceSupport(struct ncclComm* comm, ncclDataType_t dataType, ncclRedOp_t redOp, int* supported) { NCCLCHECK(comm->ncclCollNet->reduceSupport(dataType, redOp, supported)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:33:12: warning: unused function 'collNetSupport' [-Wunused-function] 33 | static int collNetSupport(struct ncclComm* comm) { return comm->ncclCollNet != nullptr ? 1 : 0; } | ^~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:15: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:209:21: warning: unused function 'ncclGdrCudaFree' [-Wunused-function] 209 | static ncclResult_t ncclGdrCudaFree(void* gdrHandle) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:43:21: warning: unused function 'computeColl' [-Wunused-function] 43 | static ncclResult_t computeColl(struct ncclInfo* info /* input */, int* workFuncIndex, struct ncclWorkElem* work, struct ncclProxyOp* proxyOp /* output */); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:57:21: warning: unused function 'getLoopInfo' [-Wunused-function] 57 | static ncclResult_t getLoopInfo(struct ncclInfo* collInfo); | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/enqueue.cc:745:21: warning: unused function 'getCBDCollnChannel' [-Wunused-function] 745 | static ncclResult_t getCBDCollnChannel(struct ncclKernelPlan* plan, struct ncclInfo* collInfo, int usableChannels) { | ^~~~~~~~~~~~~~~~~~ 36 warnings generated when compiling for host. [209/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/init.cc.o -MF CMakeFiles/rccl.dir/hipify/src/init.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/init.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:1068:7: warning: variable 'nNodes' set but not used [-Wunused-but-set-variable] 1068 | int nNodes = 1; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:1858:11: warning: unused variable 'stackSize' [-Wunused-variable] 1858 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:1859:19: warning: unused variable 'devProp' [-Wunused-variable] 1859 | hipDeviceProp_t devProp; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2183:26: warning: unused variable 'payload' [-Wunused-variable] 2183 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2197:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2197 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2504:26: warning: unused variable 'payload' [-Wunused-variable] 2504 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2534:26: warning: unused variable 'payload' [-Wunused-variable] 2534 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:17: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:37: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:38: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:826:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 826 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2168:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2168 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ 50 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:1068:7: warning: variable 'nNodes' set but not used [-Wunused-but-set-variable] 1068 | int nNodes = 1; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:1858:11: warning: unused variable 'stackSize' [-Wunused-variable] 1858 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:1859:19: warning: unused variable 'devProp' [-Wunused-variable] 1859 | hipDeviceProp_t devProp; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2183:26: warning: unused variable 'payload' [-Wunused-variable] 2183 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2197:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2197 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2504:26: warning: unused variable 'payload' [-Wunused-variable] 2504 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2534:26: warning: unused variable 'payload' [-Wunused-variable] 2534 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:17: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:37: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:38: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:826:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 826 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2168:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2168 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ 50 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:1068:7: warning: variable 'nNodes' set but not used [-Wunused-but-set-variable] 1068 | int nNodes = 1; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:1858:11: warning: unused variable 'stackSize' [-Wunused-variable] 1858 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:1859:19: warning: unused variable 'devProp' [-Wunused-variable] 1859 | hipDeviceProp_t devProp; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2183:26: warning: unused variable 'payload' [-Wunused-variable] 2183 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2197:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2197 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2504:26: warning: unused variable 'payload' [-Wunused-variable] 2504 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2534:26: warning: unused variable 'payload' [-Wunused-variable] 2534 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:17: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:37: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:38: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:826:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 826 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2168:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2168 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ 50 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:1068:7: warning: variable 'nNodes' set but not used [-Wunused-but-set-variable] 1068 | int nNodes = 1; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:1858:11: warning: unused variable 'stackSize' [-Wunused-variable] 1858 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:1859:19: warning: unused variable 'devProp' [-Wunused-variable] 1859 | hipDeviceProp_t devProp; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2183:26: warning: unused variable 'payload' [-Wunused-variable] 2183 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2197:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2197 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2504:26: warning: unused variable 'payload' [-Wunused-variable] 2504 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2534:26: warning: unused variable 'payload' [-Wunused-variable] 2534 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:17: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:37: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:38: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:826:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 826 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2168:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2168 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ 50 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:1068:7: warning: variable 'nNodes' set but not used [-Wunused-but-set-variable] 1068 | int nNodes = 1; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:1858:11: warning: unused variable 'stackSize' [-Wunused-variable] 1858 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:1859:19: warning: unused variable 'devProp' [-Wunused-variable] 1859 | hipDeviceProp_t devProp; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2183:26: warning: unused variable 'payload' [-Wunused-variable] 2183 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2197:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2197 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2504:26: warning: unused variable 'payload' [-Wunused-variable] 2504 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2534:26: warning: unused variable 'payload' [-Wunused-variable] 2534 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:17: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:37: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:38: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:826:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 826 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2168:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2168 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ 50 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:1068:7: warning: variable 'nNodes' set but not used [-Wunused-but-set-variable] 1068 | int nNodes = 1; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:1858:11: warning: unused variable 'stackSize' [-Wunused-variable] 1858 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:1859:19: warning: unused variable 'devProp' [-Wunused-variable] 1859 | hipDeviceProp_t devProp; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2183:26: warning: unused variable 'payload' [-Wunused-variable] 2183 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2197:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2197 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2504:26: warning: unused variable 'payload' [-Wunused-variable] 2504 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2534:26: warning: unused variable 'payload' [-Wunused-variable] 2534 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:17: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:37: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:38: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:826:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 826 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2168:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2168 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ 50 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:12: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:1068:7: warning: variable 'nNodes' set but not used [-Wunused-but-set-variable] 1068 | int nNodes = 1; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:1858:11: warning: unused variable 'stackSize' [-Wunused-variable] 1858 | int64_t stackSize; | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:1859:19: warning: unused variable 'devProp' [-Wunused-variable] 1859 | hipDeviceProp_t devProp; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2183:26: warning: unused variable 'payload' [-Wunused-variable] 2183 | NvtxParamsCommInitRank payload{myrank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2197:38: warning: unused variable 'CommInitAllSchema' [-Wunused-variable] 2197 | constexpr nvtxPayloadSchemaEntry_t CommInitAllSchema[] = { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2504:26: warning: unused variable 'payload' [-Wunused-variable] 2504 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2534:26: warning: unused variable 'payload' [-Wunused-variable] 2534 | NvtxParamsCommInitRank payload{rank, nranks, cudaDev}; | ^~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/channel.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:17: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:16:20: warning: unused function 'collNetName' [-Wunused-function] 16 | static const char* collNetName(struct ncclComm* comm) { return comm->ncclCollNet->name; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:17:21: warning: unused function 'collNetDevices' [-Wunused-function] 17 | static ncclResult_t collNetDevices(struct ncclComm* comm, int* ndev) { NCCLCHECK(comm->ncclCollNet->devices(ndev)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:18:21: warning: unused function 'collNetGetProperties' [-Wunused-function] 18 | static ncclResult_t collNetGetProperties(struct ncclComm* comm, int dev, ncclNetProperties_t* props) { NCCLCHECK(comm->ncclCollNet->getProperties(dev, props)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:19:21: warning: unused function 'collNetListen' [-Wunused-function] 19 | static ncclResult_t collNetListen(struct ncclComm* comm, int dev, void* handle, void** listenComm) { NCCLCHECK(comm->ncclCollNet->listen(dev, handle, listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:20:21: warning: unused function 'collNetConnect' [-Wunused-function] 20 | static ncclResult_t collNetConnect(struct ncclComm* comm, void* handles[], int nranks, int rank, void* listenComm, void** collComm) { NCCLCHECK(comm->ncclCollNet->connect(handles, nranks, rank, listenComm, collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:22:21: warning: unused function 'collNetRegMr' [-Wunused-function] 22 | static ncclResult_t collNetRegMr(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMr(collComm, data, size, type, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:24:21: warning: unused function 'collNetRegMrDmaBuf' [-Wunused-function] 24 | static ncclResult_t collNetRegMrDmaBuf(struct ncclComm* comm, void* collComm, void* data, size_t size, int type, uint64_t offset, int fd, void** mhandle) { NCCLCHECK(comm->ncclCollNet->regMrDmaBuf(collComm, data, size, type, offset, fd, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:25:21: warning: unused function 'collNetDeregMr' [-Wunused-function] 25 | static ncclResult_t collNetDeregMr(struct ncclComm* comm, void* collComm, void* mhandle) { NCCLCHECK(comm->ncclCollNet->deregMr(collComm, mhandle)); return ncclSuccess; } | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:26:21: warning: unused function 'collNetIallreduce' [-Wunused-function] 26 | static ncclResult_t collNetIallreduce(struct ncclComm* comm, void* collComm, void* sendData, void* recvData, int count, ncclDataType_t dataType, ncclRedOp_t redOp, void* sendMhandle, void* recvMhandle, void** request) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:28:21: warning: unused function 'collNetIflush' [-Wunused-function] 28 | static ncclResult_t collNetIflush(struct ncclComm* comm, void* collComm, void* data, int size, void* mhandle, void** request) { NCCLCHECK(comm->ncclCollNet->iflush(collComm, data, size, mhandle, request)); return ncclSuccess; } | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:29:21: warning: unused function 'collNetTest' [-Wunused-function] 29 | static ncclResult_t collNetTest(struct ncclComm* comm, void* request, int* done, int* size) { NCCLCHECK(comm->ncclCollNet->test(request, done, size)); return ncclSuccess; } | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:30:21: warning: unused function 'collNetCloseColl' [-Wunused-function] 30 | static ncclResult_t collNetCloseColl(struct ncclComm* comm, void* collComm) { NCCLCHECK(comm->ncclCollNet->closeColl(collComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/coll_net.h:31:21: warning: unused function 'collNetCloseListen' [-Wunused-function] 31 | static ncclResult_t collNetCloseListen(struct ncclComm* comm, void* listenComm) { NCCLCHECK(comm->ncclCollNet->closeListen(listenComm)); return ncclSuccess; } | ^~~~~~~~~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:37: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:38: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:826:21: warning: unused function 'collNetTrySetup' [-Wunused-function] 826 | static ncclResult_t collNetTrySetup(ncclComm_t comm, ncclComm_t parent, struct ncclTopoGraph* collNetGraph) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/init.cc:2168:36: warning: unused variable 'CommInitRankSchema' [-Wunused-const-variable] 2168 | constexpr nvtxPayloadSchemaEntry_t CommInitRankSchema[] = { | ^~~~~~~~~~~~~~~~~~ 50 warnings generated when compiling for host. [210/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/nvls.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/nvls.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. [211/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_socket.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_socket.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. [212/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/shm.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/shm.cc:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. [213/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/p2p.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/p2p.cc:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/p2p.cc:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ 9 warnings generated when compiling for host. [214/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_ib.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_ib.cc:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_ib.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_ib.cc:29: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 18 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_ib.cc:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_ib.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_ib.cc:29: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 18 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_ib.cc:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_ib.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_ib.cc:29: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 18 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_ib.cc:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_ib.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_ib.cc:29: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 18 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_ib.cc:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_ib.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_ib.cc:29: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 18 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_ib.cc:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_ib.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_ib.cc:29: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 18 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_ib.cc:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/net.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_ib.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_ib.cc:29: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:94:21: warning: unused function 'xmlGetAttrInt' [-Wunused-function] 94 | static ncclResult_t xmlGetAttrInt(struct ncclXmlNode* node, const char* attrName, int* value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:101:21: warning: unused function 'xmlGetAttrIntDefault' [-Wunused-function] 101 | static ncclResult_t xmlGetAttrIntDefault(struct ncclXmlNode* node, const char* attrName, int* value, int defaultValue) { | ^~~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:109:21: warning: unused function 'xmlGetAttrFloat' [-Wunused-function] 109 | static ncclResult_t xmlGetAttrFloat(struct ncclXmlNode* node, const char* attrName, float* value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:116:21: warning: unused function 'xmlFindTag' [-Wunused-function] 116 | static ncclResult_t xmlFindTag(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:128:21: warning: unused function 'xmlFindTagKv' [-Wunused-function] 128 | static ncclResult_t xmlFindTagKv(struct ncclXml* xml, const char* tagName, struct ncclXmlNode** node, const char* attrName, const char* attrValue) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:144:21: warning: unused function 'xmlSetAttr' [-Wunused-function] 144 | static ncclResult_t xmlSetAttr(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:157:21: warning: unused function 'xmlSetAttrIfUnset' [-Wunused-function] 157 | static ncclResult_t xmlSetAttrIfUnset(struct ncclXmlNode* node, const char* attrName, const char* value) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:169:21: warning: unused function 'xmlSetAttrInt' [-Wunused-function] 169 | static ncclResult_t xmlSetAttrInt(struct ncclXmlNode* node, const char* attrName, const int value) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:182:21: warning: unused function 'xmlSetAttrFloat' [-Wunused-function] 182 | static ncclResult_t xmlSetAttrFloat(struct ncclXmlNode* node, const char* attrName, const float value) { | ^~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:195:21: warning: unused function 'xmlUnsetAttr' [-Wunused-function] 195 | static ncclResult_t xmlUnsetAttr(struct ncclXmlNode* node, const char* attrName) { | ^~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:207:21: warning: unused function 'xmlGetSub' [-Wunused-function] 207 | static ncclResult_t xmlGetSub(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:233:21: warning: unused function 'xmlGetSubKvInt' [-Wunused-function] 233 | static ncclResult_t xmlGetSubKvInt(struct ncclXmlNode* node, const char* subName, struct ncclXmlNode** sub, const char* attrName, const int attrValue) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:240:21: warning: unused function 'xmlAddNode' [-Wunused-function] 240 | static ncclResult_t xmlAddNode(struct ncclXml* xml, struct ncclXmlNode* parent, const char* subName, struct ncclXmlNode** sub) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:256:21: warning: unused function 'xmlRemoveNode' [-Wunused-function] 256 | static ncclResult_t xmlRemoveNode(struct ncclXmlNode* node) { | ^~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:276:21: warning: unused function 'kvConvertToInt' [-Wunused-function] 276 | static ncclResult_t kvConvertToInt(const char* str, int* value, struct kvDict* dict) { | ^~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/xml.h:289:21: warning: unused function 'kvConvertToStr' [-Wunused-function] 289 | static ncclResult_t kvConvertToStr(int value, const char** str, struct kvDict* dict) { | ^~~~~~~~~~~~~~ 18 warnings generated when compiling for host. [215/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllGather_RING_LL128_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllGather_RING_LL128_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllGather_RING_LL128_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:61:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 61 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:174:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 174 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllGather_RING_LL128_Sum_int8_t, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:61:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 61 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:174:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 174 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllGather_RING_LL128_Sum_int8_t, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. [216/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllGather_RING_LL_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllGather_RING_LL_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllGather_RING_LL_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. [217/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/transport/net_tmp.cc.o -MF CMakeFiles/rccl.dir/hipify/src/transport/net_tmp.cc.o.d -o CMakeFiles/rccl.dir/hipify/src/transport/net_tmp.cc.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:19: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:275:21: warning: unused function 'netDumpMap' [-Wunused-function] 275 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ 15 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:19: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:275:21: warning: unused function 'netDumpMap' [-Wunused-function] 275 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ 15 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:19: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:275:21: warning: unused function 'netDumpMap' [-Wunused-function] 275 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ 15 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:19: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:275:21: warning: unused function 'netDumpMap' [-Wunused-function] 275 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ 15 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:19: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:275:21: warning: unused function 'netDumpMap' [-Wunused-function] 275 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ 15 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:19: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:275:21: warning: unused function 'netDumpMap' [-Wunused-function] 275 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ 15 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:168:14: warning: unused variable 'info' [-Wunused-variable] 168 | gdr_info_t info; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:170:12: warning: unused variable 'mh' [-Wunused-variable] 170 | gdr_mh_t mh; | ^~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:172:9: warning: unused variable 'gdrMap' [-Wunused-variable] 172 | void *gdrMap; | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:204:19: warning: unused variable 'md' [-Wunused-variable] 204 | gdr_mem_desc_t *md = (gdr_mem_desc_t*)gdrHandle; | ^~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/gdrwrap.h:161:14: warning: unused function 'ncclGdrInit' [-Wunused-function] 161 | static gdr_t ncclGdrInit() { | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:19: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:200:21: warning: unused function 'ncclTopoIdToIndex' [-Wunused-function] 200 | static ncclResult_t ncclTopoIdToIndex(struct ncclTopoSystem* system, int type, int64_t id, int* index) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:211:21: warning: unused function 'ncclTopoRankToIndex' [-Wunused-function] 211 | static ncclResult_t ncclTopoRankToIndex(struct ncclTopoSystem* system, int rank, int* index) { | ^~~~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:222:21: warning: unused function 'ncclTopoDevToRank' [-Wunused-function] 222 | static ncclResult_t ncclTopoDevToRank(struct ncclTopoSystem* system, int dev, int* rank) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:234:14: warning: unused function 'ncclTopoXGMISpeed' [-Wunused-function] 234 | static float ncclTopoXGMISpeed(const char* gcn) { | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:250:14: warning: unused function 'ncclTopoNVLinkBw' [-Wunused-function] 250 | static float ncclTopoNVLinkBw(int cudaCompCap) { | ^~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:261:13: warning: unused function 'isPow2' [-Wunused-function] 261 | static bool isPow2(int val) { | ^~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/graph/topo.h:264:12: warning: unused function 'mirrorBits' [-Wunused-function] 264 | static int mirrorBits(int val, int pow2) { | ^~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/transport/net_tmp.cc:275:21: warning: unused function 'netDumpMap' [-Wunused-function] 275 | static ncclResult_t netDumpMap(struct connectMap* map) { | ^~~~~~~~~~ 15 warnings generated when compiling for host. [218/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [219/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [220/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [221/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [222/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [223/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/onerank.cu.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/onerank.cu.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/onerank.cu.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/onerank.cu.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/onerank.cu.cpp:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common_kernel.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/onerank.cu.cpp:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common_kernel.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/onerank.cu.cpp:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common_kernel.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/onerank.cu.cpp:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common_kernel.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/onerank.cu.cpp:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common_kernel.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/onerank.cu.cpp:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common_kernel.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/onerank.cu.cpp:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common_kernel.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/onerank.cu.cpp:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. [224/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:61:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 61 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:160:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 160 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_int8_t, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:61:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 61 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:160:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 160 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_int8_t, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:61:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 61 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:160:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 160 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_int8_t, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:61:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 61 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:160:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 160 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_int8_t, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:61:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 61 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:160:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 160 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_int8_t, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:61:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 61 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:160:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 160 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_int8_t, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:61:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 61 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:160:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 160 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllGather_RING_SIMPLE_Sum_int8_t, ncclFuncAllGather, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_gather.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for host. [225/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 20 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 20 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [226/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [227/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 32 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 32 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [228/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [229/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/common.cu.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/common.cu.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/common.cu.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.cu.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.cu.cpp:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.cu.cpp:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 2 warnings generated when compiling for host. [230/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [231/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [232/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [233/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_Prod.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:16:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:16:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [234/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:16:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:16:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [235/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [236/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:16:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:16:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [237/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:16:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1025:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 1025 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:16:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_RING_LL128_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [238/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncSum<__half>, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncSum<__half>, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncSum<__half>, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:16:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:16:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:16:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 50 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncSum<__half>, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncSum<__half>, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncSum<__half>, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:16:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:16:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:16:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 50 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [239/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncProd<__half>, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncProd<__half>, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncProd<__half>, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:16:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:16:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:16:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 50 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncProd<__half>, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncProd<__half>, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncProd<__half>, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:16:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:16:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:16:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 50 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [240/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMinMax<__half>, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMinMax<__half>, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMinMax<__half>, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:16:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:16:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:16:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 50 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMinMax<__half>, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMinMax<__half>, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncMinMax<__half>, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:16:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:16:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:16:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 50 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [241/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [242/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncPreMulSum, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncPreMulSum, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncPreMulSum, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:16:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:16:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:16:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 50 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncPreMulSum, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncPreMulSum, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit<__half, FuncPreMulSum, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:432:9: note: in instantiation of member function 'Primitives, FanSymmetric<2>, 0, ProtoLL128, 0>::Primitives' requested here 432 | prims(tid, nthreads, tree->down, tree->down, args->sendbuff, args->recvbuff, args->redOpArg); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:16:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:472:9: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoLL128, 0>::Primitives' requested here 472 | prims(tid, nthreadsSplit, tree->down, &tree->up, args->sendbuff, args->recvbuff, args->redOpArg, 0*Proto::MaxGroupWidth); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:16:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:514:9: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoLL128, 0>::Primitives' requested here 514 | prims(tid-nthreadsSplit, nthreads-nthreadsSplit, &tree->up, tree->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:1033:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeSplit, ProtoLL128>' requested here 1033 | runTreeSplit(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:16:1: note: in instantiation of member function 'RunWork, 0, 1>::run' requested here 16 | DEFINE_ncclDevFunc(AllReduce_TREE_LL128_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 50 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [243/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [244/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [245/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [246/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [247/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [248/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [249/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [250/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [251/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [252/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [253/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [254/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_MinMax.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_MinMax.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_MinMax.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [255/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_Prod.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [256/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [257/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/Broadcast_RING_LL128_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/Broadcast_RING_LL128_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/Broadcast_RING_LL128_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:59:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 59 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:110:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 110 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(Broadcast_RING_LL128_Sum_int8_t, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:59:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 59 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:110:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 110 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(Broadcast_RING_LL128_Sum_int8_t, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. [258/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/Broadcast_RING_LL_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/Broadcast_RING_LL_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/Broadcast_RING_LL_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. [259/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 80 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_int8_t, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 80 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_int8_t, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 80 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_int8_t, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 80 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_int8_t, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 80 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_int8_t, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 80 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_int8_t, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:35:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 35 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:80:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 80 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllToAllPivot_RING_SIMPLE_Sum_int8_t, ncclFuncAllToAllPivot, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/alltoall_pivot.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for host. [260/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [261/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [262/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:59:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 59 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:96:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 96 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_int8_t, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:59:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 59 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:96:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 96 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_int8_t, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:59:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 59 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:96:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 96 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_int8_t, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:59:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 59 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:96:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 96 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_int8_t, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:59:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 59 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:96:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 96 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_int8_t, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:59:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 59 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:96:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 96 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_int8_t, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:7: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:59:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 59 | prims(tid, nthreads, &ring->prev, &ring->next, inputBuf, outputBuf, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:96:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 96 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Broadcast_RING_SIMPLE_Sum_int8_t, ncclFuncBroadcast, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/broadcast.h:9: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 10 warnings generated when compiling for host. [263/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_Prod.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [264/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 14 warnings generated when compiling for host. [265/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. [266/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_int8_t, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_uint8_t, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_int32_t, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_uint32_t, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_int64_t, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_uint64_t, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 15 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_int8_t, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_uint8_t, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_int32_t, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_uint32_t, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_int64_t, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_LL128_SumPostDiv_uint64_t, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 15 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. [267/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_int8_t, ncclFuncReduce, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_uint8_t, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_int32_t, ncclFuncReduce, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_uint32_t, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_int64_t, ncclFuncReduce, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_uint64_t, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_half, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_float, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_double, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_hip_bfloat16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_rccl_float8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:16:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 16 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_rccl_bfloat8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_int8_t, ncclFuncReduce, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_uint8_t, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_int32_t, ncclFuncReduce, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_uint32_t, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_int64_t, ncclFuncReduce, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_uint64_t, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_half, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_float, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_double, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_hip_bfloat16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_rccl_float8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:16:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 16 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Sum_rccl_bfloat8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. [268/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_Prod.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_int8_t, ncclFuncReduce, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_uint8_t, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_int32_t, ncclFuncReduce, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_uint32_t, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_int64_t, ncclFuncReduce, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_uint64_t, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_half, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_float, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_double, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_hip_bfloat16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_rccl_float8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:16:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 16 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_rccl_bfloat8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_int8_t, ncclFuncReduce, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_uint8_t, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_int32_t, ncclFuncReduce, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_uint32_t, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_int64_t, ncclFuncReduce, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_uint64_t, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_half, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_float, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_double, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_hip_bfloat16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_rccl_float8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:16:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 16 | DEFINE_ncclDevFunc(Reduce_RING_LL128_Prod_rccl_bfloat8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. [269/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_MinMax.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_MinMax.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_MinMax.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_int8_t, ncclFuncReduce, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_uint8_t, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_int32_t, ncclFuncReduce, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_uint32_t, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_int64_t, ncclFuncReduce, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_uint64_t, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_half, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_float, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_double, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_hip_bfloat16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_rccl_float8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:16:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 16 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_rccl_bfloat8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_int8_t, ncclFuncReduce, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_uint8_t, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_int32_t, ncclFuncReduce, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_uint32_t, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_int64_t, ncclFuncReduce, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_uint64_t, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_half, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_float, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_double, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_hip_bfloat16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_rccl_float8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:16:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 16 | DEFINE_ncclDevFunc(Reduce_RING_LL128_MinMax_rccl_bfloat8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. [270/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. [271/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_int8_t, ncclFuncReduce, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_uint8_t, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_int32_t, ncclFuncReduce, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_uint32_t, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_int64_t, ncclFuncReduce, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_uint64_t, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_half, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_float, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_double, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_hip_bfloat16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_rccl_float8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:16:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 16 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_rccl_bfloat8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_int8_t, ncclFuncReduce, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_uint8_t, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_int32_t, ncclFuncReduce, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_uint32_t, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_int64_t, ncclFuncReduce, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_uint64_t, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_half, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_float, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_double, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_hip_bfloat16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_rccl_float8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:77:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 77 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:16:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 16 | DEFINE_ncclDevFunc(Reduce_RING_LL128_PreMulSum_rccl_bfloat8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. [272/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_Prod.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. [273/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_MinMax.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_MinMax.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_MinMax.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. [274/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. [275/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. [276/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_int8_t, ncclFuncReduceScatter, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_uint8_t, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_int32_t, ncclFuncReduceScatter, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_uint32_t, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_int64_t, ncclFuncReduceScatter, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_uint64_t, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_half, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_float, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_double, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_hip_bfloat16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_rccl_float8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:16:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 16 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_rccl_bfloat8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_int8_t, ncclFuncReduceScatter, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_uint8_t, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_int32_t, ncclFuncReduceScatter, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_uint32_t, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_int64_t, ncclFuncReduceScatter, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_uint64_t, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_half, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_float, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_double, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_hip_bfloat16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_rccl_float8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:16:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 16 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Sum_rccl_bfloat8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. [277/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_int8_t, ncclFuncReduceScatter, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_uint8_t, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_int32_t, ncclFuncReduceScatter, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_uint32_t, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_int64_t, ncclFuncReduceScatter, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_uint64_t, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_half, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_float, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_double, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_hip_bfloat16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_rccl_float8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:16:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 16 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_rccl_bfloat8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_int8_t, ncclFuncReduceScatter, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_uint8_t, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_int32_t, ncclFuncReduceScatter, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_uint32_t, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_int64_t, ncclFuncReduceScatter, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_uint64_t, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_half, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_float, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_double, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_hip_bfloat16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_rccl_float8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:16:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 16 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_Prod_rccl_bfloat8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. [278/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. [279/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. [280/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. [281/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_int8_t, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_uint8_t, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_int32_t, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_uint32_t, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_int64_t, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_uint64_t, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 15 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_int8_t, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_uint8_t, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_int32_t, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_uint32_t, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_int64_t, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_SumPostDiv_uint64_t, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 15 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. [282/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. [283/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_int8_t, ncclFuncReduceScatter, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_uint8_t, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_int32_t, ncclFuncReduceScatter, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_uint32_t, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_int64_t, ncclFuncReduceScatter, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_uint64_t, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_half, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_float, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_double, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_hip_bfloat16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_rccl_float8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:16:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 16 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_rccl_bfloat8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_int8_t, ncclFuncReduceScatter, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_uint8_t, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_int32_t, ncclFuncReduceScatter, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_uint32_t, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_int64_t, ncclFuncReduceScatter, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_uint64_t, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_half, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_float, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_double, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_hip_bfloat16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_rccl_float8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:16:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 16 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_MinMax_rccl_bfloat8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. [284/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 20 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 20 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 20 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 20 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 20 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 20 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 20 warnings generated when compiling for host. [285/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_int8_t, ncclFuncReduceScatter, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_uint8_t, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_int32_t, ncclFuncReduceScatter, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_uint32_t, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_int64_t, ncclFuncReduceScatter, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_uint64_t, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_half, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_float, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_double, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_hip_bfloat16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_rccl_float8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:16:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 16 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_rccl_bfloat8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_int8_t, ncclFuncReduceScatter, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_uint8_t, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_int32_t, ncclFuncReduceScatter, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_uint32_t, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_int64_t, ncclFuncReduceScatter, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_uint64_t, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_half, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_float, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_double, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_hip_bfloat16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_rccl_float8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoLL128, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:79:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoLL128>' requested here 79 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 1>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:16:1: note: in instantiation of member function 'RunWork, 1, 1>::run' requested here 16 | DEFINE_ncclDevFunc(ReduceScatter_RING_LL128_PreMulSum_rccl_bfloat8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_LL128) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 9 warnings generated when compiling for host. [286/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:149:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 1>::Primitives' requested here 149 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:216:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runRecv>' requested here 216 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_int8_t, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:87:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 1>::Primitives' requested here 87 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:228:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runSend>' requested here 228 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_int8_t, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:149:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 1>::Primitives' requested here 149 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:216:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runRecv>' requested here 216 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_int8_t, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:87:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 1>::Primitives' requested here 87 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:228:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runSend>' requested here 228 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_int8_t, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:149:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 149 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:214:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runRecv>' requested here 214 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_int8_t, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:87:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 87 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:226:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runSend>' requested here 226 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_int8_t, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:149:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 8>, 1>::Primitives' requested here 149 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:212:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runRecv>' requested here 212 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_int8_t, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:87:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 8>, 1>::Primitives' requested here 87 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:224:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runSend>' requested here 224 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_int8_t, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:149:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 8>, 1>::Primitives' requested here 149 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:212:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runRecv>' requested here 212 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_int8_t, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:87:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 8>, 1>::Primitives' requested here 87 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:224:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runSend>' requested here 224 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_int8_t, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:149:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 149 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:214:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runRecv>' requested here 214 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_int8_t, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:87:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1, 4>, 1>::Primitives' requested here 87 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:226:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runSend>' requested here 226 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_int8_t, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:149:62: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 1>::Primitives' requested here 149 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:216:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runRecv>' requested here 216 | runRecv>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_int8_t, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:87:62: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 1>::Primitives' requested here 87 | Primitives, 0, Proto, 1> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:228:9: note: in instantiation of function template specialization 'RunWork, 1, 2>::runSend>' requested here 228 | runSend>(tid, nthreads, group, args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(SendRecv_RING_SIMPLE_Sum_int8_t, ncclFuncSendRecv, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/sendrecv.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [287/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for host. [288/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_int8_t, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_uint8_t, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_int32_t, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_uint32_t, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_int64_t, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_uint64_t, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 15 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_int8_t, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_uint8_t, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_int32_t, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_uint32_t, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_int64_t, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_uint64_t, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 15 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_int8_t, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_uint8_t, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_int32_t, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_uint32_t, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_int64_t, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_uint64_t, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 15 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_int8_t, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_uint8_t, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_int32_t, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_uint32_t, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_int64_t, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_uint64_t, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 15 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_int8_t, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_uint8_t, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_int32_t, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_uint32_t, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_int64_t, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_uint64_t, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 15 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_int8_t, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_uint8_t, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_int32_t, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_uint32_t, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_int64_t, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_uint64_t, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 15 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_int8_t, ncclFuncReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_uint8_t, ncclFuncReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_int32_t, ncclFuncReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_uint32_t, ncclFuncReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_int64_t, ncclFuncReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_SumPostDiv_uint64_t, ncclFuncReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 15 warnings generated when compiling for host. [289/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_int32_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_int32_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_int32_t.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [290/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [291/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_int8_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_int8_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_int8_t.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [292/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_int64_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_int64_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_int64_t.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [293/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [294/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [295/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_float.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_float.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_float.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [296/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_half.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_half.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_half.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncSum<__half>, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [297/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_double.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_double.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_double.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [298/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_int32_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_int32_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_int32_t.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [299/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [300/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_int64_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_int64_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_int64_t.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [301/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [302/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [303/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_int8_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_int8_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_int8_t.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [304/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [305/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Sum, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [306/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [307/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_int8_t, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_uint8_t, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_int32_t, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_uint32_t, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_int64_t, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_uint64_t, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 15 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_int8_t, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_uint8_t, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_int32_t, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_uint32_t, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_int64_t, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_uint64_t, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 15 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_int8_t, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_uint8_t, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_int32_t, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_uint32_t, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_int64_t, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_uint64_t, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 15 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_int8_t, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_uint8_t, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_int32_t, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_uint32_t, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_int64_t, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_uint64_t, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 15 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_int8_t, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_uint8_t, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_int32_t, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_uint32_t, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_int64_t, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_uint64_t, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 15 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_int8_t, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_uint8_t, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_int32_t, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_uint32_t, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_int64_t, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_uint64_t, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 15 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_int8_t, ncclFuncReduceScatter, FuncSumPostDiv, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_uint8_t, ncclFuncReduceScatter, FuncSumPostDiv, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_int32_t, ncclFuncReduceScatter, FuncSumPostDiv, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_uint32_t, ncclFuncReduceScatter, FuncSumPostDiv, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_int64_t, ncclFuncReduceScatter, FuncSumPostDiv, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_SumPostDiv_uint64_t, ncclFuncReduceScatter, FuncSumPostDiv, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 15 warnings generated when compiling for host. [308/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_half.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_half.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_half.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncProd<__half>, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [309/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/git_version.cpp.o -MF CMakeFiles/rccl.dir/git_version.cpp.o.d -o CMakeFiles/rccl.dir/git_version.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/git_version.cpp [310/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_double.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_double.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_double.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [311/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_float.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_float.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_float.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [312/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/device_table.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/device_table.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/device_table.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/device_table.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/device_table.cpp:2: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for host. [313/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [314/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [315/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/host_table.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/host_table.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/host_table.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/host_table.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/host_table.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ 1 warning generated when compiling for host. [316/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [317/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [318/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint32_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [319/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, int8_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [320/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [321/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(Prod, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [322/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_int8_t, ncclFuncReduce, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_uint8_t, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_int32_t, ncclFuncReduce, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_uint32_t, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_int64_t, ncclFuncReduce, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_uint64_t, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_half, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_float, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_double, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_hip_bfloat16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_rccl_float8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_rccl_bfloat8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_int8_t, ncclFuncReduce, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_uint8_t, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_int32_t, ncclFuncReduce, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_uint32_t, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_int64_t, ncclFuncReduce, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_uint64_t, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_half, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_float, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_double, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_hip_bfloat16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_rccl_float8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_rccl_bfloat8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_int8_t, ncclFuncReduce, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_uint8_t, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_int32_t, ncclFuncReduce, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_uint32_t, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_int64_t, ncclFuncReduce, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_uint64_t, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_half, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_float, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_double, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_hip_bfloat16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_rccl_float8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_rccl_bfloat8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_int8_t, ncclFuncReduce, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_uint8_t, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_int32_t, ncclFuncReduce, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_uint32_t, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_int64_t, ncclFuncReduce, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_uint64_t, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_half, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_float, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_double, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_hip_bfloat16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_rccl_float8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_rccl_bfloat8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_int8_t, ncclFuncReduce, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_uint8_t, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_int32_t, ncclFuncReduce, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_uint32_t, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_int64_t, ncclFuncReduce, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_uint64_t, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_half, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_float, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_double, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_hip_bfloat16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_rccl_float8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_rccl_bfloat8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_int8_t, ncclFuncReduce, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_uint8_t, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_int32_t, ncclFuncReduce, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_uint32_t, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_int64_t, ncclFuncReduce, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_uint64_t, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_half, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_float, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_double, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_hip_bfloat16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_rccl_float8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_rccl_bfloat8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_int8_t, ncclFuncReduce, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_uint8_t, ncclFuncReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_int32_t, ncclFuncReduce, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_uint32_t, ncclFuncReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_int64_t, ncclFuncReduce, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_uint64_t, ncclFuncReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_half, ncclFuncReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_float, ncclFuncReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_double, ncclFuncReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_hip_bfloat16, ncclFuncReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_rccl_float8, ncclFuncReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Prod_rccl_bfloat8, ncclFuncReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for host. [323/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_int8_t, ncclFuncReduce, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_uint8_t, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_int32_t, ncclFuncReduce, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_uint32_t, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_int64_t, ncclFuncReduce, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_uint64_t, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_half, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_float, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_double, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_hip_bfloat16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_rccl_float8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_rccl_bfloat8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_int8_t, ncclFuncReduce, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_uint8_t, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_int32_t, ncclFuncReduce, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_uint32_t, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_int64_t, ncclFuncReduce, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_uint64_t, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_half, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_float, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_double, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_hip_bfloat16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_rccl_float8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_rccl_bfloat8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_int8_t, ncclFuncReduce, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_uint8_t, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_int32_t, ncclFuncReduce, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_uint32_t, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_int64_t, ncclFuncReduce, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_uint64_t, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_half, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_float, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_double, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_hip_bfloat16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_rccl_float8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_rccl_bfloat8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_int8_t, ncclFuncReduce, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_uint8_t, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_int32_t, ncclFuncReduce, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_uint32_t, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_int64_t, ncclFuncReduce, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_uint64_t, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_half, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_float, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_double, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_hip_bfloat16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_rccl_float8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_rccl_bfloat8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_int8_t, ncclFuncReduce, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_uint8_t, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_int32_t, ncclFuncReduce, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_uint32_t, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_int64_t, ncclFuncReduce, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_uint64_t, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_half, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_float, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_double, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_hip_bfloat16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_rccl_float8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_rccl_bfloat8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_int8_t, ncclFuncReduce, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_uint8_t, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_int32_t, ncclFuncReduce, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_uint32_t, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_int64_t, ncclFuncReduce, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_uint64_t, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_half, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_float, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_double, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_hip_bfloat16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_rccl_float8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_rccl_bfloat8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_int8_t, ncclFuncReduce, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_uint8_t, ncclFuncReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_int32_t, ncclFuncReduce, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_uint32_t, ncclFuncReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_int64_t, ncclFuncReduce, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_uint64_t, ncclFuncReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_half, ncclFuncReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_float, ncclFuncReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_double, ncclFuncReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_hip_bfloat16, ncclFuncReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_rccl_float8, ncclFuncReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_Sum_rccl_bfloat8, ncclFuncReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for host. [324/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, uint64_t, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [325/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_float.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_float.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_float.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, float, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_float.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [326/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_double.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_double.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_double.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, double, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_double.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [327/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_half.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_half.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_half.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter<__half, FuncMinMax<__half>, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, half, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_half.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [328/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 20 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 20 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 20 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 20 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 20 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 20 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 20 warnings generated when compiling for host. [329/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_int8_t, ncclFuncReduce, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_uint8_t, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_int32_t, ncclFuncReduce, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_uint32_t, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_int64_t, ncclFuncReduce, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_uint64_t, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_half, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_float, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_double, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_hip_bfloat16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_rccl_float8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_rccl_bfloat8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_int8_t, ncclFuncReduce, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_uint8_t, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_int32_t, ncclFuncReduce, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_uint32_t, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_int64_t, ncclFuncReduce, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_uint64_t, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_half, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_float, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_double, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_hip_bfloat16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_rccl_float8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_rccl_bfloat8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_int8_t, ncclFuncReduce, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_uint8_t, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_int32_t, ncclFuncReduce, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_uint32_t, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_int64_t, ncclFuncReduce, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_uint64_t, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_half, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_float, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_double, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_hip_bfloat16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_rccl_float8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_rccl_bfloat8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_int8_t, ncclFuncReduce, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_uint8_t, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_int32_t, ncclFuncReduce, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_uint32_t, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_int64_t, ncclFuncReduce, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_uint64_t, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_half, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_float, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_double, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_hip_bfloat16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_rccl_float8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_rccl_bfloat8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_int8_t, ncclFuncReduce, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_uint8_t, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_int32_t, ncclFuncReduce, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_uint32_t, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_int64_t, ncclFuncReduce, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_uint64_t, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_half, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_float, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_double, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_hip_bfloat16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_rccl_float8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_rccl_bfloat8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_int8_t, ncclFuncReduce, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_uint8_t, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_int32_t, ncclFuncReduce, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_uint32_t, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_int64_t, ncclFuncReduce, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_uint64_t, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_half, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_float, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_double, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_hip_bfloat16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_rccl_float8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_rccl_bfloat8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_int8_t, ncclFuncReduce, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_uint8_t, ncclFuncReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_int32_t, ncclFuncReduce, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_uint32_t, ncclFuncReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_int64_t, ncclFuncReduce, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_uint64_t, ncclFuncReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_half, ncclFuncReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_float, ncclFuncReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_double, ncclFuncReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_hip_bfloat16, ncclFuncReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_rccl_float8, ncclFuncReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_MinMax_rccl_bfloat8, ncclFuncReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for host. [330/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, hip_bfloat16, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [331/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_float8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [332/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:508:29: warning: field 'group' will be initialized after field 'stepSize' [-Wreorder-ctor] 506 | tid(tid), nthreads(nthreads), wid(tid%WARP_SIZE), warp(tid/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~ | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t) 507 | warpInBlock(threadIdx.x/WARP_SIZE), | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | warp(tid/WARP_SIZE 508 | flagThread((tid%4)==3), group(group), | ~~~~~~~~~~~~~~~~~~~~~ ^~~~~~~~~~~ | warpInBlock(threadIdx.x/WARP_SIZE flagThread((tid%4)==3 509 | stepSize(ncclShmem.comm.buffSizes[NCCL_PROTO_LL128]/NCCL_STEPS/sizeof(uint64_t)) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoLL128, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoLL128, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:402:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 402 | mscclRunInterpreter, ProtoLL128, fullOps>(comm, algo, work); \ | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:217:57: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 1>, 1, ProtoSimple<2, 2>, 0>::Primitives' requested here 217 | Primitives, 1, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:3:9: note: in instantiation of function template specialization 'mscclRunInterpreter, ProtoSimple<2, 2>, false>' requested here 3 | MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE(MinMax, rccl_bfloat8, false); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:405:3: note: expanded from macro 'MSCCL_IMPL_KERNEL_ENTRY_FUNC_DEVREDOP_TYPE' 405 | mscclRunInterpreter, ProtoSimple, fullOps>(comm, algo, work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/msccl_kernel_impl.h:13: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 11 warnings generated when compiling for host. [333/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for host. [334/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_int8_t, ncclFuncReduceScatter, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_uint8_t, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_int32_t, ncclFuncReduceScatter, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_uint32_t, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_int64_t, ncclFuncReduceScatter, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_uint64_t, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_half, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_float, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_double, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_hip_bfloat16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_rccl_float8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_rccl_bfloat8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_int8_t, ncclFuncReduceScatter, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_uint8_t, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_int32_t, ncclFuncReduceScatter, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_uint32_t, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_int64_t, ncclFuncReduceScatter, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_uint64_t, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_half, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_float, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_double, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_hip_bfloat16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_rccl_float8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_rccl_bfloat8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_int8_t, ncclFuncReduceScatter, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_uint8_t, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_int32_t, ncclFuncReduceScatter, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_uint32_t, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_int64_t, ncclFuncReduceScatter, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_uint64_t, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_half, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_float, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_double, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_hip_bfloat16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_rccl_float8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_rccl_bfloat8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_int8_t, ncclFuncReduceScatter, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_uint8_t, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_int32_t, ncclFuncReduceScatter, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_uint32_t, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_int64_t, ncclFuncReduceScatter, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_uint64_t, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_half, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_float, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_double, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_hip_bfloat16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_rccl_float8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_rccl_bfloat8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_int8_t, ncclFuncReduceScatter, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_uint8_t, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_int32_t, ncclFuncReduceScatter, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_uint32_t, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_int64_t, ncclFuncReduceScatter, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_uint64_t, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_half, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_float, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_double, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_hip_bfloat16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_rccl_float8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_rccl_bfloat8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_int8_t, ncclFuncReduceScatter, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_uint8_t, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_int32_t, ncclFuncReduceScatter, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_uint32_t, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_int64_t, ncclFuncReduceScatter, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_uint64_t, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_half, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_float, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_double, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_hip_bfloat16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_rccl_float8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_rccl_bfloat8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_int8_t, ncclFuncReduceScatter, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_uint8_t, ncclFuncReduceScatter, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_int32_t, ncclFuncReduceScatter, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_uint32_t, ncclFuncReduceScatter, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_int64_t, ncclFuncReduceScatter, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_uint64_t, ncclFuncReduceScatter, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_half, ncclFuncReduceScatter, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_float, ncclFuncReduceScatter, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_double, ncclFuncReduceScatter, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_hip_bfloat16, ncclFuncReduceScatter, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_rccl_float8, ncclFuncReduceScatter, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Sum_rccl_bfloat8, ncclFuncReduceScatter, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for host. [335/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_int8_t, ncclFuncReduceScatter, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_uint8_t, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_int32_t, ncclFuncReduceScatter, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_uint32_t, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_int64_t, ncclFuncReduceScatter, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_uint64_t, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_half, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_float, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_double, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_hip_bfloat16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_rccl_float8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_rccl_bfloat8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_int8_t, ncclFuncReduceScatter, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_uint8_t, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_int32_t, ncclFuncReduceScatter, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_uint32_t, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_int64_t, ncclFuncReduceScatter, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_uint64_t, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_half, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_float, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_double, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_hip_bfloat16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_rccl_float8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_rccl_bfloat8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_int8_t, ncclFuncReduceScatter, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_uint8_t, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_int32_t, ncclFuncReduceScatter, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_uint32_t, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_int64_t, ncclFuncReduceScatter, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_uint64_t, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_half, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_float, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_double, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_hip_bfloat16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_rccl_float8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_rccl_bfloat8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_int8_t, ncclFuncReduceScatter, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_uint8_t, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_int32_t, ncclFuncReduceScatter, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_uint32_t, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_int64_t, ncclFuncReduceScatter, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_uint64_t, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_half, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_float, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_double, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_hip_bfloat16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_rccl_float8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_rccl_bfloat8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_int8_t, ncclFuncReduceScatter, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_uint8_t, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_int32_t, ncclFuncReduceScatter, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_uint32_t, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_int64_t, ncclFuncReduceScatter, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_uint64_t, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_half, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_float, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_double, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_hip_bfloat16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_rccl_float8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_rccl_bfloat8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_int8_t, ncclFuncReduceScatter, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_uint8_t, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_int32_t, ncclFuncReduceScatter, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_uint32_t, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_int64_t, ncclFuncReduceScatter, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_uint64_t, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_half, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_float, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_double, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_hip_bfloat16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_rccl_float8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_rccl_bfloat8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_int8_t, ncclFuncReduceScatter, FuncProd, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_uint8_t, ncclFuncReduceScatter, FuncProd, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_int32_t, ncclFuncReduceScatter, FuncProd, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_uint32_t, ncclFuncReduceScatter, FuncProd, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_int64_t, ncclFuncReduceScatter, FuncProd, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_uint64_t, ncclFuncReduceScatter, FuncProd, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncProd<__half>, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_half, ncclFuncReduceScatter, FuncProd, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_float, ncclFuncReduceScatter, FuncProd, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_double, ncclFuncReduceScatter, FuncProd, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_hip_bfloat16, ncclFuncReduceScatter, FuncProd, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_rccl_float8, ncclFuncReduceScatter, FuncProd, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_Prod_rccl_bfloat8, ncclFuncReduceScatter, FuncProd, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for host. [336/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncSum<__half>, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for host. [337/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_int8_t, ncclFuncReduceScatter, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_uint8_t, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_int32_t, ncclFuncReduceScatter, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_uint32_t, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_int64_t, ncclFuncReduceScatter, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_uint64_t, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_half, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_float, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_double, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_hip_bfloat16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_rccl_float8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_rccl_bfloat8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_int8_t, ncclFuncReduceScatter, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_uint8_t, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_int32_t, ncclFuncReduceScatter, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_uint32_t, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_int64_t, ncclFuncReduceScatter, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_uint64_t, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_half, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_float, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_double, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_hip_bfloat16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_rccl_float8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_rccl_bfloat8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_int8_t, ncclFuncReduceScatter, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_uint8_t, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_int32_t, ncclFuncReduceScatter, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_uint32_t, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_int64_t, ncclFuncReduceScatter, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_uint64_t, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_half, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_float, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_double, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_hip_bfloat16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_rccl_float8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_rccl_bfloat8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_int8_t, ncclFuncReduceScatter, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_uint8_t, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_int32_t, ncclFuncReduceScatter, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_uint32_t, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_int64_t, ncclFuncReduceScatter, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_uint64_t, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_half, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_float, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_double, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_hip_bfloat16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_rccl_float8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_rccl_bfloat8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_int8_t, ncclFuncReduceScatter, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_uint8_t, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_int32_t, ncclFuncReduceScatter, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_uint32_t, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_int64_t, ncclFuncReduceScatter, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_uint64_t, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_half, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_float, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_double, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_hip_bfloat16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_rccl_float8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_rccl_bfloat8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_int8_t, ncclFuncReduceScatter, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_uint8_t, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_int32_t, ncclFuncReduceScatter, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_uint32_t, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_int64_t, ncclFuncReduceScatter, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_uint64_t, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_half, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_float, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_double, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_hip_bfloat16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_rccl_float8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_rccl_bfloat8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_int8_t, ncclFuncReduceScatter, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_uint8_t, ncclFuncReduceScatter, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_int32_t, ncclFuncReduceScatter, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_uint32_t, ncclFuncReduceScatter, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_int64_t, ncclFuncReduceScatter, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_uint64_t, ncclFuncReduceScatter, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_half, ncclFuncReduceScatter, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_float, ncclFuncReduceScatter, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_double, ncclFuncReduceScatter, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_hip_bfloat16, ncclFuncReduceScatter, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_rccl_float8, ncclFuncReduceScatter, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_MinMax_rccl_bfloat8, ncclFuncReduceScatter, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for host. [338/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncMinMax<__half>, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for host. [339/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_int8_t, ncclFuncReduce, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_uint8_t, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_int32_t, ncclFuncReduce, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_uint32_t, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_int64_t, ncclFuncReduce, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_uint64_t, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_half, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_float, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_double, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_rccl_float8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_int8_t, ncclFuncReduce, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_uint8_t, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_int32_t, ncclFuncReduce, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_uint32_t, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_int64_t, ncclFuncReduce, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_uint64_t, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_half, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_float, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_double, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_rccl_float8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_int8_t, ncclFuncReduce, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_uint8_t, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_int32_t, ncclFuncReduce, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_uint32_t, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_int64_t, ncclFuncReduce, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_uint64_t, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_half, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_float, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_double, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_rccl_float8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_int8_t, ncclFuncReduce, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_uint8_t, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_int32_t, ncclFuncReduce, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_uint32_t, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_int64_t, ncclFuncReduce, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_uint64_t, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_half, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_float, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_double, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_rccl_float8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_int8_t, ncclFuncReduce, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_uint8_t, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_int32_t, ncclFuncReduce, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_uint32_t, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_int64_t, ncclFuncReduce, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_uint64_t, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_half, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_float, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_double, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_rccl_float8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_int8_t, ncclFuncReduce, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_uint8_t, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_int32_t, ncclFuncReduce, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_uint32_t, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_int64_t, ncclFuncReduce, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_uint64_t, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_half, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_float, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_double, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_rccl_float8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_int8_t, ncclFuncReduce, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_uint8_t, ncclFuncReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_int32_t, ncclFuncReduce, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_uint32_t, ncclFuncReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_int64_t, ncclFuncReduce, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_uint64_t, ncclFuncReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_half, ncclFuncReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_float, ncclFuncReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_double, ncclFuncReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_rccl_float8, ncclFuncReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:33:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 33 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:63:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<1, 1>>' requested here 63 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(Reduce_RING_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for host. [340/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 50 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 50 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 50 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 50 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 50 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 50 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int8_t, ncclFuncAllReduce, FuncSumPostDiv, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint8_t, ncclFuncAllReduce, FuncSumPostDiv, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int32_t, ncclFuncAllReduce, FuncSumPostDiv, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint32_t, ncclFuncAllReduce, FuncSumPostDiv, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_int64_t, ncclFuncAllReduce, FuncSumPostDiv, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv_uint64_t, ncclFuncAllReduce, FuncSumPostDiv, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 50 warnings generated when compiling for host. [341/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncProd<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for host. [342/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncSum<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for host. [343/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_int8_t, ncclFuncReduceScatter, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_uint8_t, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_int32_t, ncclFuncReduceScatter, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_uint32_t, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_int64_t, ncclFuncReduceScatter, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_uint64_t, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_half, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_float, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_double, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_rccl_float8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_int8_t, ncclFuncReduceScatter, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_uint8_t, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_int32_t, ncclFuncReduceScatter, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_uint32_t, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_int64_t, ncclFuncReduceScatter, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_uint64_t, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_half, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_float, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_double, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_rccl_float8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_int8_t, ncclFuncReduceScatter, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_uint8_t, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_int32_t, ncclFuncReduceScatter, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_uint32_t, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_int64_t, ncclFuncReduceScatter, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_uint64_t, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_half, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_float, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_double, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_rccl_float8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_int8_t, ncclFuncReduceScatter, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_uint8_t, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_int32_t, ncclFuncReduceScatter, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_uint32_t, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_int64_t, ncclFuncReduceScatter, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_uint64_t, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_half, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_float, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_double, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_rccl_float8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_int8_t, ncclFuncReduceScatter, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_uint8_t, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_int32_t, ncclFuncReduceScatter, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_uint32_t, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_int64_t, ncclFuncReduceScatter, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_uint64_t, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_half, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_float, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_double, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_rccl_float8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_int8_t, ncclFuncReduceScatter, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_uint8_t, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_int32_t, ncclFuncReduceScatter, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_uint32_t, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_int64_t, ncclFuncReduceScatter, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_uint64_t, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_half, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_float, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_double, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_rccl_float8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_int8_t, ncclFuncReduceScatter, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_uint8_t, ncclFuncReduceScatter, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_int32_t, ncclFuncReduceScatter, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_uint32_t, ncclFuncReduceScatter, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_int64_t, ncclFuncReduceScatter, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_uint64_t, ncclFuncReduceScatter, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_half, ncclFuncReduceScatter, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_float, ncclFuncReduceScatter, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_double, ncclFuncReduceScatter, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncReduceScatter, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_rccl_float8, ncclFuncReduceScatter, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:34:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 34 | prims(tid, nthreads, &ring->prev, &ring->next, args->sendbuff, args->recvbuff, args->redOpArg, 0, args->connIndex, args->connIndex); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:65:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 65 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(ReduceScatter_RING_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncReduceScatter, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/reduce_scatter.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 21 warnings generated when compiling for host. [344/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing<__half, FuncPreMulSum, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:71:56: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 0, ProtoSimple<2, 2>, 0>::Primitives' requested here 71 | Primitives, 0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:569:5: note: in instantiation of function template specialization '(anonymous namespace)::runRing, ProtoSimple<2, 2>>' requested here 569 | runRing(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 1, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 1, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_RING_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_RING, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for host. [345/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncMinMax<__half>, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for host. [346/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown<__half, FuncPreMulSum, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:262:90: note: in instantiation of member function 'Primitives, FanAsymmetric<2, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 262 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:311:90: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 2>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 311 | Primitives, /*Direct=*/0, Proto, 0> prims | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:576:5: note: in instantiation of function template specialization '(anonymous namespace)::runTreeUpDown, ProtoSimple<1, 1>>' requested here 576 | runTreeUpDown>(args); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 0, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 0, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_TREE_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_TREE, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 38 warnings generated when compiling for host. [347/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for host. [348/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for host. [349/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for host. [350/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:955:7: note: in instantiation of member function 'Primitives, FanSymmetric<1>, 1, ProtoSimple<1, 1>, 0>::Primitives' requested here 955 | prims(groupTid, groupNthreads, &recv, &send, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 3, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 3, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_CHAIN, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 26 warnings generated when compiling for host. [351/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int8_t, ncclFuncAllReduce, FuncSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint8_t, ncclFuncAllReduce, FuncSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int32_t, ncclFuncAllReduce, FuncSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint32_t, ncclFuncAllReduce, FuncSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_int64_t, ncclFuncAllReduce, FuncSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_uint64_t, ncclFuncAllReduce, FuncSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncSum<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_half, ncclFuncAllReduce, FuncSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_float, ncclFuncAllReduce, FuncSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_double, ncclFuncAllReduce, FuncSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_hip_bfloat16, ncclFuncAllReduce, FuncSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_float8, ncclFuncAllReduce, FuncSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Sum_rccl_bfloat8, ncclFuncAllReduce, FuncSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for host. [352/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int8_t, ncclFuncAllReduce, FuncProd, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint8_t, ncclFuncAllReduce, FuncProd, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int32_t, ncclFuncAllReduce, FuncProd, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint32_t, ncclFuncAllReduce, FuncProd, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_int64_t, ncclFuncAllReduce, FuncProd, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_uint64_t, ncclFuncAllReduce, FuncProd, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncProd<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_half, ncclFuncAllReduce, FuncProd, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_float, ncclFuncAllReduce, FuncProd, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_double, ncclFuncAllReduce, FuncProd, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_hip_bfloat16, ncclFuncAllReduce, FuncProd, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_float8, ncclFuncAllReduce, FuncProd, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_Prod_rccl_bfloat8, ncclFuncAllReduce, FuncProd, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for host. [353/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int8_t, ncclFuncAllReduce, FuncMinMax, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint8_t, ncclFuncAllReduce, FuncMinMax, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int32_t, ncclFuncAllReduce, FuncMinMax, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint32_t, ncclFuncAllReduce, FuncMinMax, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_int64_t, ncclFuncAllReduce, FuncMinMax, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_uint64_t, ncclFuncAllReduce, FuncMinMax, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncMinMax<__half>, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_half, ncclFuncAllReduce, FuncMinMax, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_float, ncclFuncAllReduce, FuncMinMax, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_double, ncclFuncAllReduce, FuncMinMax, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_hip_bfloat16, ncclFuncAllReduce, FuncMinMax, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_float8, ncclFuncAllReduce, FuncMinMax, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_MinMax_rccl_bfloat8, ncclFuncAllReduce, FuncMinMax, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for host. [354/356] /usr/bin/hipcc -DCOMPILE_MSCCL_KERNEL -DENABLE_COLLTRACE -DENABLE_LL128 -DHIP_CONTIGUOUS_MEMORY -DHIP_UNCACHED_MEMORY -DNVTX_DISABLE -DNVTX_NO_IMPL -DROCM_VERSION=60201 -DROCTX_NO_IMPL -DUSE_PROF_API=1 -DUSE_ROCM_SMI64CONFIG -DUSE_ROCM_SMI_THREAD_ONLY_MUTEX -D__HIP_PLATFORM_AMD__=1 -Drccl_EXPORTS -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device -I/builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/network/unpack -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -std=c++14 -fPIC -Werror=uninitialized -Werror=sometimes-uninitialized -Wno-format-nonliteral -fgpu-rdc -fvisibility=hidden -mllvm --amdgpu-kernarg-preload-count=16 -x hip --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -MD -MT CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp.o -MF CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp.o.d -o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp.o -c /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for gfx900. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for gfx906. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for gfx908. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for gfx90a. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for gfx942. In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:8: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/device.h:13: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/rccl_float8.h:76:18: warning: unused variable 'y' [-Wunused-variable] 76 | uint32_t y, head, mantissa; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:168: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:14: warning: unused variable 'data1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:21: warning: unused variable 'flag1' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:28: warning: unused variable 'data2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:140:35: warning: unused variable 'flag2' [-Wunused-variable] 140 | uint32_t data1, flag1, data2, flag2; | ^~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll.h:532:9: warning: variable 'offset' set but not used [-Wunused-but-set-variable] 532 | int offset = tid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:169: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:270:19: warning: unused variable 'ptr' [-Wunused-variable] 270 | uint64_t* ptr = recvPtr(0)+ll128Offset; | ^~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_ll128.h:385:9: warning: variable 'wireOffset' set but not used [-Wunused-but-set-variable] 385 | int wireOffset = WireWordPerSlice*warp + 2*wid; | ^ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:33:19: warning: unused variable 'size' [-Wunused-variable] 33 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:63:9: warning: variable 'minChunkSize' set but not used [-Wunused-but-set-variable] 63 | int minChunkSize; | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:231:19: warning: unused variable 'size' [-Wunused-variable] 231 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:380:19: warning: unused variable 'size' [-Wunused-variable] 380 | const ssize_t size = args->count; | ^~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:381:15: warning: unused variable 'bid' [-Wunused-variable] 381 | const int bid = gridOffset / channelCount; | ^~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:167: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:4:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 4 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int8_t, ncclFuncAllReduce, FuncPreMulSum, int8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:5:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 5 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint8_t, ncclFuncAllReduce, FuncPreMulSum, uint8_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:6:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 6 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int32_t, ncclFuncAllReduce, FuncPreMulSum, int32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:7:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 7 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint32_t, ncclFuncAllReduce, FuncPreMulSum, uint32_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:8:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 8 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_int64_t, ncclFuncAllReduce, FuncPreMulSum, int64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:9:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 9 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_uint64_t, ncclFuncAllReduce, FuncPreMulSum, uint64_t, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives<__half, FuncPreMulSum, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:10:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 10 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_half, ncclFuncAllReduce, FuncPreMulSum, half, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:11:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 11 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_float, ncclFuncAllReduce, FuncPreMulSum, float, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:12:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 12 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_double, ncclFuncAllReduce, FuncPreMulSum, double, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:13:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 13 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_hip_bfloat16, ncclFuncAllReduce, FuncPreMulSum, hip_bfloat16, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:14:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 14 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_float8, ncclFuncAllReduce, FuncPreMulSum, rccl_float8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:607:9: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 607 | prims(tid-tidStartScatter, nThreadsScatter, NULL, direct->up, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:622:11: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 622 | prims(tid-tidStartReduce, nThreadsReduce, direct->down, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:636:11: note: in instantiation of member function 'Primitives, FanAsymmetric<0, 1>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 636 | prims(tid-tidStartReduce, nThreadsReduce, nullptr, &direct->out, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:647:9: note: in instantiation of member function 'Primitives, FanAsymmetric<7, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 647 | prims(tid, nThreadsGather, direct->up, NULL, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:658:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 7>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 658 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, direct->down, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: warning: initializer order does not match the declaration order [-Wreorder-ctor] 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ ~~~~~~~~~~~~~~~~~~~~~~ ~~~~~~~~~~~ | tidInBlock(threadIdx.x nthreads(nthreads stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_ 641 | stepSize(stepSize_ == 0 ? ncclShmem.comm.buffSizes[NCCL_PROTO_SIMPLE]/NCCL_STEPS/sizeof(T) : stepSize_) { | ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | group(group /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:668:11: note: in instantiation of member function 'Primitives, FanAsymmetric<1, 0>, 0, ProtoSimple<1, 1>, 0>::Primitives' requested here 668 | prims(tid-tidStartBcast, nThreadsBcast, &direct->out, nullptr, args->sendbuff, args->recvbuff, | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:202:53: note: in instantiation of member function 'RunWorkElement, 2, 2>::run' requested here 202 | RunWorkElement().run(we); | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:15:1: note: in instantiation of member function 'RunWork, 2, 2>::run' requested here 15 | DEFINE_ncclDevFunc(AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum_rccl_bfloat8, ncclFuncAllReduce, FuncPreMulSum, rccl_bfloat8, NCCL_ALGO_COLLNET_DIRECT, NCCL_PROTO_SIMPLE) | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:410:49: note: expanded from macro 'DEFINE_ncclDevFunc' 410 | RunWork, algo, proto>().run(&ncclShmem.work); \ | ^ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:15: note: field 'nthreads' will be initialized after field 'tidInBlock' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~~~~~~~ /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/prims_simple.h:640:60: note: field 'group' will be initialized after field 'stepSize' 640 | tid(tid), nthreads(nthreads), tidInBlock(threadIdx.x), group(group), | ^~~~~~~~~~~ In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp:1: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/all_reduce.h:10: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/primitives.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/device/common.h:17: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/comm.h:11: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/transport.h:12: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/graph.h:126: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/info.h:14: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/core.h:37: In file included from /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/alloc.h:14: /builddir/build/BUILD/rccl-6.2.1-build/rccl-rocm-6.2.1/redhat-linux-build-gfx9/hipify/src/include/utils.h:46:13: warning: unused function 'log2i' [-Wunused-function] 46 | static long log2i(long n) { | ^~~~~ 86 warnings generated when compiling for host. [355/356] : && /usr/bin/cmake -E time /usr/bin/hipcc -fPIC -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes -Xoffload-linker -mllvm=-amdgpu-kernarg-preload-count=16 -Xlinker --dependency-file=CMakeFiles/rccl.dir/link.d -shared -Wl,-soname,librccl.so.1 -o librccl.so.1.0 CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o CMakeFiles/rccl.dir/hipify/src/channel.cc.o CMakeFiles/rccl.dir/hipify/src/collectives.cc.o CMakeFiles/rccl.dir/hipify/src/debug.cc.o CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o CMakeFiles/rccl.dir/hipify/src/group.cc.o CMakeFiles/rccl.dir/hipify/src/init.cc.o CMakeFiles/rccl.dir/hipify/src/init_nvtx.cc.o CMakeFiles/rccl.dir/hipify/src/net.cc.o CMakeFiles/rccl.dir/hipify/src/msccl.cc.o CMakeFiles/rccl.dir/hipify/src/proxy.cc.o CMakeFiles/rccl.dir/hipify/src/register.cc.o CMakeFiles/rccl.dir/hipify/src/transport.cc.o CMakeFiles/rccl.dir/hipify/src/device/common.cu.cpp.o CMakeFiles/rccl.dir/hipify/src/device/onerank.cu.cpp.o CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o CMakeFiles/rccl.dir/hipify/src/misc/alt_rsmi.cc.o CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o CMakeFiles/rccl.dir/hipify/src/misc/roctx.cc.o CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o CMakeFiles/rccl.dir/hipify/src/misc/tuner.cc.o CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o CMakeFiles/rccl.dir/hipify/src/transport/net_tmp.cc.o CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o CMakeFiles/rccl.dir/hipify/src/device/AllGather_RING_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllGather_RING_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Broadcast_RING_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Broadcast_RING_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_int8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_int32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_int64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_half.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_float.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_double.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_int8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_int32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_int64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_half.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_float.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_double.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_half.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_float.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_double.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp.o CMakeFiles/rccl.dir/hipify/src/device/device_table.cpp.o CMakeFiles/rccl.dir/hipify/src/device/host_table.cpp.o CMakeFiles/rccl.dir/git_version.cpp.o -fgpu-rdc -ldl /usr/lib64/librocm_smi64.so.1.0 /usr/lib64/libamdhip64.so.6.3.42131 --hip-link --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -lpthread -lrt -ldl && : FAILED: librccl.so.1.0 : && /usr/bin/cmake -E time /usr/bin/hipcc -fPIC -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes -Xoffload-linker -mllvm=-amdgpu-kernarg-preload-count=16 -Xlinker --dependency-file=CMakeFiles/rccl.dir/link.d -shared -Wl,-soname,librccl.so.1 -o librccl.so.1.0 CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o CMakeFiles/rccl.dir/hipify/src/channel.cc.o CMakeFiles/rccl.dir/hipify/src/collectives.cc.o CMakeFiles/rccl.dir/hipify/src/debug.cc.o CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o CMakeFiles/rccl.dir/hipify/src/group.cc.o CMakeFiles/rccl.dir/hipify/src/init.cc.o CMakeFiles/rccl.dir/hipify/src/init_nvtx.cc.o CMakeFiles/rccl.dir/hipify/src/net.cc.o CMakeFiles/rccl.dir/hipify/src/msccl.cc.o CMakeFiles/rccl.dir/hipify/src/proxy.cc.o CMakeFiles/rccl.dir/hipify/src/register.cc.o CMakeFiles/rccl.dir/hipify/src/transport.cc.o CMakeFiles/rccl.dir/hipify/src/device/common.cu.cpp.o CMakeFiles/rccl.dir/hipify/src/device/onerank.cu.cpp.o CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o CMakeFiles/rccl.dir/hipify/src/misc/alt_rsmi.cc.o CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o CMakeFiles/rccl.dir/hipify/src/misc/roctx.cc.o CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o CMakeFiles/rccl.dir/hipify/src/misc/tuner.cc.o CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o CMakeFiles/rccl.dir/hipify/src/transport/net_tmp.cc.o CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o CMakeFiles/rccl.dir/hipify/src/device/AllGather_RING_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllGather_RING_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Broadcast_RING_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Broadcast_RING_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_int8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_int32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_int64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_half.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_float.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_double.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_int8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_int32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_int64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_half.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_float.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_double.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_half.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_float.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_double.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp.o CMakeFiles/rccl.dir/hipify/src/device/device_table.cpp.o CMakeFiles/rccl.dir/hipify/src/device/host_table.cpp.o CMakeFiles/rccl.dir/git_version.cpp.o -fgpu-rdc -ldl /usr/lib64/librocm_smi64.so.1.0 /usr/lib64/libamdhip64.so.6.3.42131 --hip-link --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -lpthread -lrt -ldl && : clang++: warning: argument unused during compilation: '-Xarch_host -fstack-protector-strong' [-Wunused-command-line-argument] clang++: warning: argument unused during compilation: '-Xarch_host -fcf-protection' [-Wunused-command-line-argument] clang++: warning: argument unused during compilation: '-specs=/usr/lib/rpm/redhat/redhat-package-notes' [-Wunused-command-line-argument] ld.lld: error: undefined hidden symbol: __hip_gpubin_handle_87480c4326bf9436 >>> referenced by common.cu.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by common.cu.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by common.cu.cpp >>> lto.tmp:(__hip_module_dtor) >>> referenced 1 more times ld.lld: error: undefined hidden symbol: __hip_gpubin_handle_fc4a99094279e396 >>> referenced by onerank.cu.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by onerank.cu.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by onerank.cu.cpp >>> lto.tmp:(__hip_module_dtor) >>> referenced 1 more times ld.lld: error: undefined hidden symbol: __hip_gpubin_handle_495b272fd4f26c7e >>> referenced by msccl_kernel_MinMax_rccl_bfloat8.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_MinMax_rccl_bfloat8.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_MinMax_rccl_bfloat8.cpp >>> lto.tmp:(__hip_module_dtor) >>> referenced 1 more times ld.lld: error: undefined hidden symbol: __hip_gpubin_handle_7771d400933336d4 >>> referenced by msccl_kernel_MinMax_rccl_float8.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_MinMax_rccl_float8.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_MinMax_rccl_float8.cpp >>> lto.tmp:(__hip_module_dtor) >>> referenced 1 more times ld.lld: error: undefined hidden symbol: __hip_gpubin_handle_bcf008cfe309c491 >>> referenced by msccl_kernel_MinMax_hip_bfloat16.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_MinMax_hip_bfloat16.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_MinMax_hip_bfloat16.cpp >>> lto.tmp:(__hip_module_dtor) >>> referenced 1 more times ld.lld: error: undefined hidden symbol: __hip_gpubin_handle_20827df9eb0d937e >>> referenced by msccl_kernel_MinMax_double.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_MinMax_double.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_MinMax_double.cpp >>> lto.tmp:(__hip_module_dtor) >>> referenced 1 more times ld.lld: error: undefined hidden symbol: __hip_gpubin_handle_d815211f736711ad >>> referenced by msccl_kernel_MinMax_float.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_MinMax_float.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_MinMax_float.cpp >>> lto.tmp:(__hip_module_dtor) >>> referenced 1 more times ld.lld: error: undefined hidden symbol: __hip_gpubin_handle_5fea838610fdd9c1 >>> referenced by msccl_kernel_MinMax_int64_t.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_MinMax_int64_t.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_MinMax_int64_t.cpp >>> lto.tmp:(__hip_module_dtor) >>> referenced 1 more times ld.lld: error: undefined hidden symbol: __hip_gpubin_handle_aee3d52e220a36c0 >>> referenced by msccl_kernel_MinMax_uint64_t.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_MinMax_uint64_t.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_MinMax_uint64_t.cpp >>> lto.tmp:(__hip_module_dtor) >>> referenced 1 more times ld.lld: error: undefined hidden symbol: __hip_gpubin_handle_97b8e853e61926b3 >>> referenced by msccl_kernel_MinMax_uint32_t.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_MinMax_uint32_t.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_MinMax_uint32_t.cpp >>> lto.tmp:(__hip_module_dtor) >>> referenced 1 more times ld.lld: error: undefined hidden symbol: __hip_gpubin_handle_3809467a73585689 >>> referenced by msccl_kernel_MinMax_half.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_MinMax_half.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_MinMax_half.cpp >>> lto.tmp:(__hip_module_dtor) >>> referenced 1 more times ld.lld: error: undefined hidden symbol: __hip_gpubin_handle_28156b0450e3debd >>> referenced by msccl_kernel_MinMax_uint8_t.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_MinMax_uint8_t.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_MinMax_uint8_t.cpp >>> lto.tmp:(__hip_module_dtor) >>> referenced 1 more times ld.lld: error: undefined hidden symbol: __hip_gpubin_handle_eb7803f13afd4f6b >>> referenced by msccl_kernel_MinMax_int32_t.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_MinMax_int32_t.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_MinMax_int32_t.cpp >>> lto.tmp:(__hip_module_dtor) >>> referenced 1 more times ld.lld: error: undefined hidden symbol: __hip_gpubin_handle_dd3ebf7f6d613e3 >>> referenced by msccl_kernel_Prod_rccl_bfloat8.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_Prod_rccl_bfloat8.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_Prod_rccl_bfloat8.cpp >>> lto.tmp:(__hip_module_dtor) >>> referenced 1 more times ld.lld: error: undefined hidden symbol: __hip_gpubin_handle_896198d10faa6708 >>> referenced by msccl_kernel_MinMax_int8_t.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_MinMax_int8_t.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_MinMax_int8_t.cpp >>> lto.tmp:(__hip_module_dtor) >>> referenced 1 more times ld.lld: error: undefined hidden symbol: __hip_gpubin_handle_fd5f732175f56260 >>> referenced by msccl_kernel_Prod_rccl_float8.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_Prod_rccl_float8.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_Prod_rccl_float8.cpp >>> lto.tmp:(__hip_module_dtor) >>> referenced 1 more times ld.lld: error: undefined hidden symbol: __hip_gpubin_handle_e08bfce87d6b9a01 >>> referenced by msccl_kernel_Prod_hip_bfloat16.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_Prod_hip_bfloat16.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_Prod_hip_bfloat16.cpp >>> lto.tmp:(__hip_module_dtor) >>> referenced 1 more times ld.lld: error: undefined hidden symbol: __hip_gpubin_handle_c9490a52fef55810 >>> referenced by msccl_kernel_Prod_double.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_Prod_double.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_Prod_double.cpp >>> lto.tmp:(__hip_module_dtor) >>> referenced 1 more times ld.lld: error: undefined hidden symbol: __hip_gpubin_handle_adbdddbba311c003 >>> referenced by msccl_kernel_Prod_uint64_t.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_Prod_uint64_t.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_Prod_uint64_t.cpp >>> lto.tmp:(__hip_module_dtor) >>> referenced 1 more times ld.lld: error: undefined hidden symbol: __hip_gpubin_handle_8a0f027758b01602 >>> referenced by msccl_kernel_Prod_float.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_Prod_float.cpp >>> lto.tmp:(__hip_module_ctor) >>> referenced by msccl_kernel_Prod_float.cpp >>> lto.tmp:(__hip_module_dtor) >>> referenced 1 more times ld.lld: error: too many errors emitted, stopping now (use --error-limit=0 to see all errors) clang++: error: linker command failed with exit code 1 (use -v to see invocation) failed to execute:/usr/lib64/rocm/llvm/bin/clang++ --driver-mode=g++ --hip-link --offload-arch=gfx900 --offload-arch=gfx906:xnack- --offload-arch=gfx908:xnack- --offload-arch=gfx90a:xnack+ --offload-arch=gfx90a:xnack- --offload-arch=gfx942 -fPIC -O2 -flto=thin -fexceptions -g -grecord-gcc-switches -pipe -Wall -Werror=format-security -Wp,-U_FORTIFY_SOURCE,-D_FORTIFY_SOURCE=3 -Wp,-D_GLIBCXX_ASSERTIONS --config /usr/lib/rpm/redhat/redhat-hardened-clang.cfg -Xarch_host -fstack-protector-strong -m64 -march=x86-64 -mtune=generic -fasynchronous-unwind-tables -fstack-clash-protection -Xarch_host -fcf-protection -fno-omit-frame-pointer -mno-omit-leaf-frame-pointer -O2 -g -DNDEBUG -Wl,-z,relro -Wl,--as-needed -Wl,-z,pack-relative-relocs -Wl,-z,now -Wl,-z,now -Wl,--build-id=sha1 -specs=/usr/lib/rpm/redhat/redhat-package-notes -Xoffload-linker -mllvm=-amdgpu-kernarg-preload-count=16 -Xlinker --dependency-file=CMakeFiles/rccl.dir/link.d -shared -Wl,-soname,librccl.so.1 -o "librccl.so.1.0" CMakeFiles/rccl.dir/hipify/src/bootstrap.cc.o CMakeFiles/rccl.dir/hipify/src/channel.cc.o CMakeFiles/rccl.dir/hipify/src/collectives.cc.o CMakeFiles/rccl.dir/hipify/src/debug.cc.o CMakeFiles/rccl.dir/hipify/src/enqueue.cc.o CMakeFiles/rccl.dir/hipify/src/group.cc.o CMakeFiles/rccl.dir/hipify/src/init.cc.o CMakeFiles/rccl.dir/hipify/src/init_nvtx.cc.o CMakeFiles/rccl.dir/hipify/src/net.cc.o CMakeFiles/rccl.dir/hipify/src/msccl.cc.o CMakeFiles/rccl.dir/hipify/src/proxy.cc.o CMakeFiles/rccl.dir/hipify/src/register.cc.o CMakeFiles/rccl.dir/hipify/src/transport.cc.o CMakeFiles/rccl.dir/hipify/src/device/common.cu.cpp.o CMakeFiles/rccl.dir/hipify/src/device/onerank.cu.cpp.o CMakeFiles/rccl.dir/hipify/src/graph/connect.cc.o CMakeFiles/rccl.dir/hipify/src/graph/paths.cc.o CMakeFiles/rccl.dir/hipify/src/graph/rings.cc.o CMakeFiles/rccl.dir/hipify/src/graph/rome_models.cc.o CMakeFiles/rccl.dir/hipify/src/graph/search.cc.o CMakeFiles/rccl.dir/hipify/src/graph/topo.cc.o CMakeFiles/rccl.dir/hipify/src/graph/trees.cc.o CMakeFiles/rccl.dir/hipify/src/graph/tuning.cc.o CMakeFiles/rccl.dir/hipify/src/graph/xml.cc.o CMakeFiles/rccl.dir/hipify/src/misc/alt_rsmi.cc.o CMakeFiles/rccl.dir/hipify/src/misc/archinfo.cc.o CMakeFiles/rccl.dir/hipify/src/misc/argcheck.cc.o CMakeFiles/rccl.dir/hipify/src/misc/ibvsymbols.cc.o CMakeFiles/rccl.dir/hipify/src/misc/ibvwrap.cc.o CMakeFiles/rccl.dir/hipify/src/misc/ipcsocket.cc.o CMakeFiles/rccl.dir/hipify/src/misc/npkit.cc.o CMakeFiles/rccl.dir/hipify/src/misc/nvmlwrap_stub.cc.o CMakeFiles/rccl.dir/hipify/src/misc/param.cc.o CMakeFiles/rccl.dir/hipify/src/misc/profiler.cc.o CMakeFiles/rccl.dir/hipify/src/misc/rocm_smi_wrap.cc.o CMakeFiles/rccl.dir/hipify/src/misc/rocmwrap.cc.o CMakeFiles/rccl.dir/hipify/src/misc/roctx.cc.o CMakeFiles/rccl.dir/hipify/src/misc/shmutils.cc.o CMakeFiles/rccl.dir/hipify/src/misc/signals.cc.o CMakeFiles/rccl.dir/hipify/src/misc/socket.cc.o CMakeFiles/rccl.dir/hipify/src/misc/strongstream.cc.o CMakeFiles/rccl.dir/hipify/src/misc/tuner.cc.o CMakeFiles/rccl.dir/hipify/src/misc/utils.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_lifecycle.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_parser.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_setup.cc.o CMakeFiles/rccl.dir/hipify/src/misc/msccl/msccl_status.cc.o CMakeFiles/rccl.dir/hipify/src/transport/coll_net.cc.o CMakeFiles/rccl.dir/hipify/src/transport/net_tmp.cc.o CMakeFiles/rccl.dir/hipify/src/transport/net_ib.cc.o CMakeFiles/rccl.dir/hipify/src/transport/net_socket.cc.o CMakeFiles/rccl.dir/hipify/src/transport/nvls.cc.o CMakeFiles/rccl.dir/hipify/src/transport/p2p.cc.o CMakeFiles/rccl.dir/hipify/src/transport/shm.cc.o CMakeFiles/rccl.dir/hipify/src/device/AllGather_RING_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllGather_RING_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllGather_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_LL128_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_TREE_SIMPLE_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_LL128_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_RING_SIMPLE_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_LL128_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_DIRECT_SIMPLE_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_LL128_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllReduce_COLLNET_CHAIN_SIMPLE_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/AllToAllPivot_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Broadcast_RING_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Broadcast_RING_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Broadcast_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_LL128_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/Reduce_RING_SIMPLE_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_LL128_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_Prod.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_MinMax.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_PreMulSum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/ReduceScatter_RING_SIMPLE_SumPostDiv.cpp.o CMakeFiles/rccl.dir/hipify/src/device/SendRecv_RING_SIMPLE_Sum.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_int8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_uint8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_int32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_uint32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_int64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_uint64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_half.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_float.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_double.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_hip_bfloat16.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_rccl_float8.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Sum_rccl_bfloat8.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_int8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_uint8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_int32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_uint32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_int64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_uint64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_half.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_float.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_double.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_hip_bfloat16.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_rccl_float8.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_Prod_rccl_bfloat8.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_int8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_uint8_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_int32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_uint32_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_int64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_uint64_t.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_half.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_float.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_double.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_hip_bfloat16.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_rccl_float8.cpp.o CMakeFiles/rccl.dir/hipify/src/device/msccl_kernel_MinMax_rccl_bfloat8.cpp.o CMakeFiles/rccl.dir/hipify/src/device/device_table.cpp.o CMakeFiles/rccl.dir/hipify/src/device/host_table.cpp.o CMakeFiles/rccl.dir/git_version.cpp.o -fgpu-rdc -ldl /usr/lib64/librocm_smi64.so.1.0 /usr/lib64/libamdhip64.so.6.3.42131 --hip-link -lpthread -lrt -ldl Elapsed time (seconds): 3940.17 ninja: build stopped: subcommand failed. RPM build errors: error: Bad exit status from /var/tmp/rpm-tmp.wc12qt (%build) Bad exit status from /var/tmp/rpm-tmp.wc12qt (%build) Child return code was: 1 EXCEPTION: [Error('Command failed: \n # /usr/bin/systemd-nspawn -q -M 2d2fd6b0534047fbbc531e2c72c9db62 -D /var/lib/mock/f42-build-55706471-6538073/root -a -u mockbuild --capability=cap_ipc_lock --bind=/tmp/mock-resolv.vcer5xhi:/etc/resolv.conf --bind=/dev/btrfs-control --bind=/dev/mapper/control --bind=/dev/fuse --bind=/dev/loop-control --bind=/dev/loop0 --bind=/dev/loop1 --bind=/dev/loop2 --bind=/dev/loop3 --bind=/dev/loop4 --bind=/dev/loop5 --bind=/dev/loop6 --bind=/dev/loop7 --bind=/dev/loop8 --bind=/dev/loop9 --bind=/dev/loop10 --bind=/dev/loop11 --console=pipe --setenv=TERM=vt100 --setenv=SHELL=/bin/bash --setenv=HOME=/builddir --setenv=HOSTNAME=mock --setenv=PATH=/usr/bin:/bin:/usr/sbin:/sbin \'--setenv=PROMPT_COMMAND=printf "\\033]0;\\007"\' \'--setenv=PS1= \\s-\\v\\$ \' --setenv=LANG=C.UTF-8 --resolv-conf=off bash --login -c \'/usr/bin/rpmbuild -bb --noclean --target x86_64 --nodeps /builddir/build/SPECS/rccl.spec\'\n', 1)] Traceback (most recent call last): File "/usr/lib/python3.13/site-packages/mockbuild/trace_decorator.py", line 93, in trace result = func(*args, **kw) File "/usr/lib/python3.13/site-packages/mockbuild/util.py", line 610, in do_with_status raise exception.Error("Command failed: \n # %s\n%s" % (cmd_pretty(command, env), output), child.returncode) mockbuild.exception.Error: Command failed: # /usr/bin/systemd-nspawn -q -M 2d2fd6b0534047fbbc531e2c72c9db62 -D /var/lib/mock/f42-build-55706471-6538073/root -a -u mockbuild --capability=cap_ipc_lock --bind=/tmp/mock-resolv.vcer5xhi:/etc/resolv.conf --bind=/dev/btrfs-control --bind=/dev/mapper/control --bind=/dev/fuse --bind=/dev/loop-control --bind=/dev/loop0 --bind=/dev/loop1 --bind=/dev/loop2 --bind=/dev/loop3 --bind=/dev/loop4 --bind=/dev/loop5 --bind=/dev/loop6 --bind=/dev/loop7 --bind=/dev/loop8 --bind=/dev/loop9 --bind=/dev/loop10 --bind=/dev/loop11 --console=pipe --setenv=TERM=vt100 --setenv=SHELL=/bin/bash --setenv=HOME=/builddir --setenv=HOSTNAME=mock --setenv=PATH=/usr/bin:/bin:/usr/sbin:/sbin '--setenv=PROMPT_COMMAND=printf "\033]0;\007"' '--setenv=PS1= \s-\v\$ ' --setenv=LANG=C.UTF-8 --resolv-conf=off bash --login -c '/usr/bin/rpmbuild -bb --noclean --target x86_64 --nodeps /builddir/build/SPECS/rccl.spec'